Ignore:
Timestamp:
Jul 30, 2019, 12:24:25 AM (5 years ago)
Author:
Murray Heymann <heymann.murray@…>
Branches:
(u'spielwiese', '17f1d200f27c5bd38f5dfc6e8a0879242279d1d8')
Children:
de88e1d84f18979811df4c3d1dc68f221a3362ef
Parents:
8d8fefe7898bd9e2156488544587049b7107d0c1
Message:
Fix some minor errors
File:
1 edited

Legend:

Unmodified
Added
Removed
  • machine_learning/model/predictor.py

    r8d8fef rfeed60b  
    33"""
    44
    5 import cProfile
     5# import cProfile
    66import os
    77import sys
     
    5656                # dist = vector_distance(x, vec)
    5757                # Dot product is much faster
    58                 dist = -np.dot(x, vec)
     58                dist = -1 * np.dot(x, vec)
    5959                if dist < min_val:
    6060                    min_val = dist
     
    6868
    6969
    70 def main():
     70def basic_vector_tests():
    7171    """
    72     Run some basic tests
     72    Some basic sanity tests
    7373    """
    74     print("Running some tests")
    7574    predictor = HelpPagePredictor()
    76     vector1 = normalise_vector([1, 4, 10])
    77     vector2 = normalise_vector([2, 3, 1])
    78     vector3 = normalise_vector([3, 9, 3])
     75    vector1 = normalise_vector(np.array([1, 4, 10]))
     76    vector2 = normalise_vector(np.array([2, 3, 1]))
     77    vector3 = normalise_vector(np.array([3, 9, 3]))
    7978
    8079    vectors = np.array([vector1, vector2, vector3])
     
    8483    print()
    8584
    86     testvec = normalise_vector([1, 1, 1])
     85    testvec = normalise_vector(np.array([1, 1, 1]))
    8786    print("test vector:")
    8887    print(testvec)
     
    105104    print()
    106105
     106
     107def main():
     108    """
     109    Run some basic tests
     110    """
     111    print("Running some tests")
     112
     113    basic_vector_tests()
     114
    107115    dictionary = read_dictionary(KEYWORDS_FILE)
    108116
     
    113121
    114122    test_vec = count_occurances("extract.lib", dictionary)
     123    predictor = HelpPagePredictor()
    115124    predictor.fit(vectors, file_list)
    116125
     
    124133    print("prediction for zero vector")
    125134    zerovec = np.zeros(len(dictionary) - 2)
    126     print(len(zerovec))
    127135    start = time.time()
    128136    prediction = predictor.predict(np.array([zerovec]))
     
    138146            if not os.path.isfile(sys.argv[i]):
    139147                continue
    140             print ("predicting for file", sys.argv[i])
     148            print("predicting for file", sys.argv[i])
    141149            test_vec = count_occurances(sys.argv[i], dictionary)
    142150            start = time.time()
Note: See TracChangeset for help on using the changeset viewer.