Skip to content

Commit

Permalink
Update tests
Browse files (browse the repository at this point in the history)
  • Loading branch information
Olivie Franklova (CZ) authored and Olivie Franklova (CZ) committed May 28, 2024
1 parent ff54010 commit d54c699
Show file tree
Hide file tree
Showing 3 changed files with 66 additions and 60 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/column2Vec_test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -27,5 +27,5 @@ jobs:
- name: Run tests
run: |
pytest test/test_column2Vec.py test/test_column2VecCache.py
pytest test/test_column2Vec.py
2 changes: 1 addition & 1 deletion .github/workflows/py_test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ jobs:
python-tests:
env:
TEST_FILES: test/test_types.py test/test_metadata.py test/test_comparator.py
TEST_FILES: test/test_types.py test/test_metadata.py test/test_comparator.py test/test_column2VecCache.py
name: Run Python Tests
runs-on: ubuntu-latest
steps:
Expand Down
122 changes: 64 additions & 58 deletions test/test_column2VecCache.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,73 +27,74 @@ def setUpClass(self):
files = [fileM2]
self.data = get_nonnumerical_data(files)
for i in self.data:
self.first = self.data[i]
self.first = self.data[i].head(100)
break
cache.set_file("generated/test.csv")
self.model = SentenceTransformer(MODEL)

def setUp(self):
cache.clear_cache()
cache.clear_persistent_cache()
cache.on()

def test_column2vec_as_sentence(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_as_sentence, self.first, model, "a")

second = time_measure_function(column2vec_as_sentence, self.first, model, "a")
first = time_measure_function(column2vec_as_sentence, self.first, self.model, "a")

second = time_measure_function(column2vec_as_sentence, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_as_sentence, self.first, model, "a")
third = time_measure_function(column2vec_as_sentence, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)


def test_column2vec_as_sentence_clean(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_as_sentence_clean, self.first, model, "a")

second = time_measure_function(column2vec_as_sentence_clean, self.first, model, "a")
first = time_measure_function(column2vec_as_sentence_clean, self.first, self.model, "a")

second = time_measure_function(column2vec_as_sentence_clean, self.first, self.model, "a")

cache.off()
third = time_measure_function(column2vec_as_sentence_clean, self.first, model, "a")
third = time_measure_function(column2vec_as_sentence_clean, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)

def test_column2vec_as_sentence_clean_uniq(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, model, "a")

second = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, model, "a")
first = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, self.model, "a")

second = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, model, "a")
third = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)

def test_column2vec_avg(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_avg, self.first, model, "a")

second = time_measure_function(column2vec_avg, self.first, model, "a")
first = time_measure_function(column2vec_avg, self.first, self.model, "a")

second = time_measure_function(column2vec_avg, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_avg, self.first, model, "a")
third = time_measure_function(column2vec_avg, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)


def test_column2vec_weighted_avg(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_weighted_avg, self.first, model, "a")

second = time_measure_function(column2vec_weighted_avg, self.first, model, "a")
first = time_measure_function(column2vec_weighted_avg, self.first, self.model, "a")

second = time_measure_function(column2vec_weighted_avg, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_weighted_avg, self.first, model, "a")
third = time_measure_function(column2vec_weighted_avg, self.first, self.model, "a")

print(f"{first} : {second} : {third}")

Expand All @@ -102,12 +103,12 @@ def test_column2vec_weighted_avg(self):


def test_column2vec_sum(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_sum, self.first, model, "a")

second = time_measure_function(column2vec_sum, self.first, model, "a")
first = time_measure_function(column2vec_sum, self.first, self.model, "a")

second = time_measure_function(column2vec_sum, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_sum, self.first, model, "a")
third = time_measure_function(column2vec_sum, self.first, self.model, "a")

print(f"{first} : {second} : {third}")

Expand All @@ -116,13 +117,13 @@ def test_column2vec_sum(self):


def test_column2vec_weighted_sum(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_weighted_sum, self.first, model, "a")

second = time_measure_function(column2vec_weighted_sum, self.first, model, "a")
first = time_measure_function(column2vec_weighted_sum, self.first, self.model, "a")

second = time_measure_function(column2vec_weighted_sum, self.first, self.model, "a")

cache.off()
third = time_measure_function(column2vec_weighted_sum, self.first, model, "a")
third = time_measure_function(column2vec_weighted_sum, self.first, self.model, "a")

print(f"{first} : {second} : {third}")

Expand All @@ -138,84 +139,89 @@ def setUpClass(self):
# make an array of all the files
files = [fileM2]
self.data = get_nonnumerical_data(files)
skip = True
for i in self.data:
self.first = self.data[i]
if skip:
skip = False
continue
self.first = self.data[i].head(100)
break
cache.set_file("cache_test.csv")
self.model = SentenceTransformer(MODEL)

def setUp(self):
cache.clear_cache()
cache.clear_persistent_cache()
cache.on()

def test_column2vec_as_sentence(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_as_sentence, self.first, model, "a")

first = time_measure_function(column2vec_as_sentence, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_as_sentence, self.first, model, "a")
second = time_measure_function(column2vec_as_sentence, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_as_sentence, self.first, model, "a")
third = time_measure_function(column2vec_as_sentence, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)


def test_column2vec_as_sentence_clean(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_as_sentence_clean, self.first, model, "a")

first = time_measure_function(column2vec_as_sentence_clean, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_as_sentence_clean, self.first, model, "a")
second = time_measure_function(column2vec_as_sentence_clean, self.first, self.model, "a")

cache.off()
third = time_measure_function(column2vec_as_sentence_clean, self.first, model, "a")
third = time_measure_function(column2vec_as_sentence_clean, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)

def test_column2vec_as_sentence_clean_uniq(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, model, "a")

first = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, model, "a")
second = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, model, "a")
third = time_measure_function(column2vec_as_sentence_clean_uniq, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)

def test_column2vec_avg(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_avg, self.first, model, "a")

first = time_measure_function(column2vec_avg, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_avg, self.first, model, "a")
second = time_measure_function(column2vec_avg, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_avg, self.first, model, "a")
third = time_measure_function(column2vec_avg, self.first, self.model, "a")

print(f"{first} : {second} : {third}")
self.assertGreater(first, second)
self.assertGreater(third, second)


def test_column2vec_weighted_avg(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_weighted_avg, self.first, model, "a")

first = time_measure_function(column2vec_weighted_avg, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_weighted_avg, self.first, model, "a")
second = time_measure_function(column2vec_weighted_avg, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_weighted_avg, self.first, model, "a")
third = time_measure_function(column2vec_weighted_avg, self.first, self.model, "a")

print(f"{first} : {second} : {third}")

Expand All @@ -224,14 +230,14 @@ def test_column2vec_weighted_avg(self):


def test_column2vec_sum(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_sum, self.first, model, "a")

first = time_measure_function(column2vec_sum, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_sum, self.first, model, "a")
second = time_measure_function(column2vec_sum, self.first, self.model, "a")
cache.off()
third = time_measure_function(column2vec_sum, self.first, model, "a")
third = time_measure_function(column2vec_sum, self.first, self.model, "a")

print(f"{first} : {second} : {third}")

Expand All @@ -240,15 +246,15 @@ def test_column2vec_sum(self):


def test_column2vec_weighted_sum(self):
model = SentenceTransformer(MODEL)
first = time_measure_function(column2vec_weighted_sum, self.first, model, "a")

first = time_measure_function(column2vec_weighted_sum, self.first, self.model, "a")
cache.save_persistently()
cache.clear_cache()

second = time_measure_function(column2vec_weighted_sum, self.first, model, "a")
second = time_measure_function(column2vec_weighted_sum, self.first, self.model, "a")

cache.off()
third = time_measure_function(column2vec_weighted_sum, self.first, model, "a")
third = time_measure_function(column2vec_weighted_sum, self.first, self.model, "a")

print(f"{first} : {second} : {third}")

Expand Down

0 comments on commit d54c699

Please sign in to comment.