|
@@ -19,7 +19,7 @@ BASE_DIR = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
|
|
|
LECTION_DIR = os.path.join("EASvZI", "Лекции")
|
|
|
|
|
|
# ссылка для проверки
|
|
|
-url = "http://213.155.192.79:3001/u21-25gavrilenko/EASvZI/src/6b61ce083a7486f58211beef8cb0334ff78db881/%d0%93%d0%b0%d0%b2%d1%80%d0%b8%d0%bb%d0%b5%d0%bd%d0%ba%d0%be.md"
|
|
|
+url = "http://213.155.192.79:3001/u21-25petrov/EASvZI/src/9b20c7ba3e493e4c000da0eacb3954e8ea8cf71a/%d0%9b%d0%b5%d0%ba%d1%86%d0%b8%d0%b8/1.3.100_%d0%9f%d0%be%d1%82%d0%b5%d0%bd%d1%86%d0%b8%d0%b0%d0%bb%d1%8c%d0%bd%d1%8b%d0%b5_%d1%83%d0%b3%d1%80%d0%be%d0%b7%d1%8b_%d0%b1%d0%b5%d0%b7%d0%be%d0%bf%d0%b0%d1%81%d0%bd%d0%be%d1%81%d1%82%d0%b8/%d0%9f%d0%b5%d1%82%d1%80%d0%be%d0%b2.md"
|
|
|
|
|
|
# ------------------------------- / НАСТРОЙКИ ------------
|
|
|
|
|
@@ -174,24 +174,28 @@ for readme_str in readme_list:
|
|
|
variant_uri = variant_uri.replace("),", "")
|
|
|
variant_uri = variant_uri.replace(")", "")
|
|
|
variant_uri = variant_uri.strip()
|
|
|
-
|
|
|
- variant_path = os.path.join(BASE_DIR, LECTION_DIR, variant_uri)
|
|
|
- try:
|
|
|
- with open(variant_path, encoding="utf-8") as f:
|
|
|
- variant_html = f.read()
|
|
|
- except:
|
|
|
- with open(variant_path, encoding="cp1251") as f:
|
|
|
- variant_html = f.read()
|
|
|
-
|
|
|
- variant_tokens, variant_uniq_text = preprocess_text(variant_html)
|
|
|
- print(f"количество уникальных слов варианта: {len(set(variant_tokens))}")
|
|
|
-
|
|
|
- # пересечение множеств
|
|
|
- min_tokens_len = min([len(set(post_tokens)), len(set(variant_tokens))])
|
|
|
- c = list(set(post_tokens) & set(variant_tokens))
|
|
|
- ratio = (1 - (len(c) / min_tokens_len)) * 100
|
|
|
- print(f"количество совпадающих слов: {len(c)} / {ratio:.2f}%")
|
|
|
- print()
|
|
|
+
|
|
|
+ if "youtube" in variant_uri:
|
|
|
+ print("youtube - не проверяем")
|
|
|
+ print()
|
|
|
+ else:
|
|
|
+ variant_path = os.path.join(BASE_DIR, LECTION_DIR, variant_uri)
|
|
|
+ try:
|
|
|
+ with open(variant_path, encoding="utf-8") as f:
|
|
|
+ variant_html = f.read()
|
|
|
+ except:
|
|
|
+ with open(variant_path, encoding="cp1251") as f:
|
|
|
+ variant_html = f.read()
|
|
|
+
|
|
|
+ variant_tokens, variant_uniq_text = preprocess_text(variant_html)
|
|
|
+ print(f"количество уникальных слов варианта: {len(set(variant_tokens))}")
|
|
|
+
|
|
|
+ # пересечение множеств
|
|
|
+ min_tokens_len = min([len(set(post_tokens)), len(set(variant_tokens))])
|
|
|
+ c = list(set(post_tokens) & set(variant_tokens))
|
|
|
+ ratio = (1 - (len(c) / min_tokens_len)) * 100
|
|
|
+ print(f"количество совпадающих слов: {len(c)} / {ratio:.2f}%")
|
|
|
+ print()
|
|
|
|
|
|
if not(lection_exist):
|
|
|
print("Лекция не найдена в readme")
|