Skip to content
Snippets Groups Projects
Commit 53fdd7b0 authored by Love Arreborn's avatar Love Arreborn
Browse files

pushing latest changes before temporary deploy

parent 9677e955
Branches
No related tags found
No related merge requests found
Pipeline #141380 skipped
No preview for this file type
......@@ -10,9 +10,14 @@ def run_connectives(doc: Doc) -> dict:
"""
connectives = doc._.connectives
n_words = doc._.scream_metrics["surface_metrics"]["n_words"]

# Grand total across all connective categories.
# FIX: the original wrote `total = connectives[key]` inside the loop
# (assignment, not accumulation), so CNCAll ended up holding only the
# last category's count instead of the sum. (A stray debug
# `print(connectives)` was also removed.)
connectives["CNCAll"] = sum(connectives.values())

# Convert raw counts (including CNCAll) to incidence per 1000 words.
# NOTE(review): raises ZeroDivisionError when n_words == 0 (empty doc);
# confirm upstream guarantees at least one word.
for key in connectives:
    connectives[key] = connectives[key] / n_words * 1000
......
......@@ -136,16 +136,9 @@ def run_pipeline(args: str, test: bool) -> list:
# ================== PARSING ==================
start_time = time.time()
doc, node_tree = process_file(filename)
# doc = process_file(filename)
if test:
time_checker(start_time, "spaCy", timestamps)
# pprint.pp(doc._.scream_metrics)
# pprint.pp(doc._.coh_metrix)
# pprint.pp(doc._.synonyms)
# return doc
# ================== STILETT ==================
start_time = time.time()
simplified_text, sentence_transformations = ud_text_simplifier.simplify_text(
......@@ -156,7 +149,7 @@ def run_pipeline(args: str, test: bool) -> list:
# ================== SYNONYMS ==================
# start_time = time.time()
# synonym_dict = synonyms.run_synonyms(processed['parsed'])
# synonym_dict = synonyms.run_synonyms(processed["parsed"])
# time_checker(start_time, "Synonyms", timestamps)
result.append(
......
......@@ -272,14 +272,6 @@ def scream_metrics(doc: Doc) -> Doc:
# Tally, per category, how many configured connectives occur in this
# sentence. (Leftover debug print removed; `.keys()` dropped since
# iterating a dict yields its keys.)
# NOTE(review): `connective in sent.text` is a plain substring test —
# it can match inside longer words and counts at most once per sentence
# no matter how often the connective appears; confirm this is intended.
for category in config.CONNECTIVES:
    for connective in config.CONNECTIVES[category]:
        if connective in sent.text:
            connectives[category] += 1
# unfortunate double looping, unavoidable if we need to skip punctuation
......
......@@ -150,20 +150,20 @@ def contains_name_predicate(sentence: Tree) -> bool:
return False
def read_collocation_list():
    """Load the LMI collocation resource.

    Each line of the file is a tab-separated record whose first field is
    a space-separated collocation; returns a list of lowercased token
    lists, one per line.
    """
    path = "../synonyms_textad/resources/collocations_lmi.txt"
    with open(path, "r") as source:
        # First split on tab to isolate the collocation field, then on
        # space to get its individual tokens.
        return [line.split("\t")[0].lower().split(" ") for line in source]


collocation_list = read_collocation_list()
# def read_collocation_list():
# """
# read the list of collocations
# """
# collocation_list = []
# with open("../synonyms_textad/resources/collocations_lmi.txt", "r") as f:
# for row in f:
# # splitta först på tab och sen på space
# collocations = row.split("\t")[0].lower().split(" ")
# collocation_list.append(collocations)
# return collocation_list
# collocation_list = read_collocation_list()
def check_bigram(curr_lemma, next_lemma):
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment