зеркало из
https://github.com/ssciwr/AMMICO.git
synced 2025-10-29 13:06:04 +02:00
merge
Этот коммит содержится в:
Коммит
4add286d7d
@ -1,6 +1,6 @@
|
||||
repos:
|
||||
- repo: https://github.com/kynan/nbstripout
|
||||
rev: 0.7.1
|
||||
rev: 0.8.1
|
||||
hooks:
|
||||
- id: nbstripout
|
||||
files: ".ipynb"
|
||||
|
||||
@ -173,8 +173,8 @@
|
||||
"source": [
|
||||
"%pwd\n",
|
||||
"image_dict = ammico.find_files(\n",
|
||||
" path=\"data/errors_Nov24/Error1\",\n",
|
||||
" # path=str(data_path),\n",
|
||||
" # path = \"/content/drive/MyDrive/misinformation-data/\",\n",
|
||||
" path=str(data_path),\n",
|
||||
" limit=15,\n",
|
||||
")"
|
||||
]
|
||||
|
||||
@ -237,6 +237,15 @@ class TextDetector(AnalysisMethod):
|
||||
if not self.subdict["text"]:
|
||||
print("No text found - skipping analysis.")
|
||||
else:
|
||||
# make sure all full stops are followed by whitespace
|
||||
# otherwise googletrans breaks
|
||||
index_stop = self.subdict["text"].find(".")
|
||||
if self.subdict["text"][index_stop + 1] != " ":
|
||||
self.subdict["text"] = (
|
||||
self.subdict["text"][: index_stop + 1]
|
||||
+ " "
|
||||
+ self.subdict["text"][index_stop + 1 :]
|
||||
)
|
||||
self.translate_text()
|
||||
self.remove_linebreaks()
|
||||
if self.analyse_text:
|
||||
|
||||
Загрузка…
x
Ссылка в новой задаче
Block a user