Skip to content

Commit

Permalink
#109 fix all Ruff formatting and linting errors
Browse files (browse the repository at this point in the history)
  • Loading branch information
andrewtavis committed Mar 20, 2024
1 parent f86e9ac commit 6ab8d17
Show file tree
Hide file tree
Showing 29 changed files with 76 additions and 51 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/pr_ci.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -46,4 +46,4 @@ jobs:

- name: Run ruff - Linting and import sorting check
if: always()
run: ruff check .
run: ruff check .
5 changes: 2 additions & 3 deletions src/scribe_data/checkquery.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@
"""

import argparse
import contextlib
import math
import os
import subprocess
Expand Down Expand Up @@ -304,12 +305,10 @@ def check_positive_int(value: str, err_msg: str) -> int:
------
argparse.ArgumentTypeError
"""
try:
with contextlib.suppress(ValueError):
number = int(value)
if number >= 1:
return number
except ValueError:
pass

raise argparse.ArgumentTypeError(err_msg)

Expand Down
8 changes: 4 additions & 4 deletions src/scribe_data/extract_transform/extract_wiki.py
Original file line number Diff line number Diff line change
Expand Up @@ -320,9 +320,9 @@ def parse_to_ndjson(
print(f"Making {output_dir} directory for the output")
os.makedirs(output_dir)

if multicore == True:
if multicore:
num_cores = os.cpu_count()
elif multicore == False:
elif not multicore:
num_cores = 1
elif isinstance(multicore, int):
num_cores = multicore
Expand Down Expand Up @@ -372,8 +372,8 @@ def read_and_combine_json(file_path):
data = []

with open(file_path, "r", encoding="utf-8") as f:
for l in f:
data.append(json.loads(l))
for line in f:
data.append(json.loads(line))

return data

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import translate_to_other_languages
from scribe_data.utils import translate_to_other_languages # noqa: E402

SRC_LANG = "English"
translate_script_dir = os.path.dirname(os.path.abspath(__file__))
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import translate_to_other_languages
from scribe_data.utils import translate_to_other_languages # noqa: E402

SRC_LANG = "French"
translate_script_dir = os.path.dirname(os.path.abspath(__file__))
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import translate_to_other_languages
from scribe_data.utils import translate_to_other_languages # noqa: E402

SRC_LANG = "Russian"
translate_script_dir = os.path.dirname(os.path.abspath(__file__))
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data, map_genders
from scribe_data.utils import ( # noqa: E402
export_formatted_data,
load_queried_data,
map_genders,
)

file_path = sys.argv[0]

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import export_formatted_data, load_queried_data
from scribe_data.utils import export_formatted_data, load_queried_data # noqa: E402

file_path = sys.argv[0]

Expand Down
Empty file.
3 changes: 1 addition & 2 deletions src/scribe_data/extract_transform/process_unicode.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,15 +8,14 @@
import csv
import fileinput
import json
import re
from importlib.resources import files

import emoji
from icu import Char, UProperty
from tqdm.auto import tqdm

from scribe_data.extract_transform.emoji_utils import get_emoji_codes_to_ignore
from scribe_data.load.update_utils import (
from scribe_data.utils import (
get_language_iso,
get_path_from_et_dir,
)
Expand Down
1 change: 0 additions & 1 deletion src/scribe_data/extract_transform/process_wiki.py
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,6 @@
from tqdm.auto import tqdm

from scribe_data.utils import (
get_ios_data_path,
get_language_qid,
get_language_words_to_ignore,
get_language_words_to_remove,
Expand Down
36 changes: 18 additions & 18 deletions src/scribe_data/load/data_to_sqlite.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import get_ios_data_path, get_language_iso
from scribe_data.utils import get_language_iso # noqa: E402

PATH_TO_ET_FILES = "../extract_transform/"

Expand Down Expand Up @@ -76,32 +76,32 @@
languages_update = current_languages if languages is None else languages

language_word_type_dict = {
l: [
lang: [
f.split(".json")[0]
for f in os.listdir(f"{PATH_TO_ET_FILES}{l}/formatted_data")
for f in os.listdir(f"{PATH_TO_ET_FILES}{lang}/formatted_data")
if f.split(".json")[0] in word_types
]
for l in languages_update
for lang in languages_update
}

print(
f"Creating SQLite databases for the following languages: {', '.join(languages_update)}"
)
for l in tqdm(
for lang in tqdm(
language_word_type_dict,
desc="Databases created",
unit="dbs",
):
if language_word_type_dict[l] != []:
if language_word_type_dict[lang] != []:
maybe_over = "" # output string formatting variable (see below)
if os.path.exists(
f"databases/{get_language_iso(l).upper()}LanguageData.sqlite"
f"databases/{get_language_iso(lang).upper()}LanguageData.sqlite"
):
os.remove(f"databases/{get_language_iso(l).upper()}LanguageData.sqlite")
os.remove(f"databases/{get_language_iso(lang).upper()}LanguageData.sqlite")
maybe_over = "over"

connection = sqlite3.connect(
f"databases/{get_language_iso(l).upper()}LanguageData.sqlite"
f"databases/{get_language_iso(lang).upper()}LanguageData.sqlite"
)
cursor = connection.cursor()

Expand Down Expand Up @@ -139,11 +139,11 @@ def table_insert(word_type, keys):
keys,
)

print(f"Database for {l} {maybe_over}written and connection made.")
for wt in language_word_type_dict[l]:
print(f"Creating {l} {wt} table...")
print(f"Database for {lang} {maybe_over}written and connection made.")
for wt in language_word_type_dict[lang]:
print(f"Creating {lang} {wt} table...")
json_data = json.load(
open(f"{PATH_TO_ET_FILES}{l}/formatted_data/{wt}.json")
open(f"{PATH_TO_ET_FILES}{lang}/formatted_data/{wt}.json")
)

if wt == "nouns":
Expand All @@ -153,9 +153,9 @@ def table_insert(word_type, keys):
keys = [row, json_data[row]["plural"], json_data[row]["form"]]
table_insert(word_type=wt, keys=keys)

if "Scribe" not in json_data and l != "Russian":
if "Scribe" not in json_data and lang != "Russian":
table_insert(word_type=wt, keys=["Scribe", "Scribes", ""])
# elif "Писец" not in json_data and l == "Russian":
# elif "Писец" not in json_data and lang == "Russian":
# table_insert(word_type=wt, keys=["Писец", "Писцы", ""])

connection.commit()
Expand Down Expand Up @@ -214,7 +214,7 @@ def table_insert(word_type, keys):
connection.commit()

wt = "autocomplete_lexicon"
print(f"Creating {l} {wt} table...")
print(f"Creating {lang} {wt} table...")
cols = ["word"]
create_table(word_type=wt, cols=cols)

Expand Down Expand Up @@ -306,7 +306,7 @@ def table_insert(word_type, keys):

connection.commit()

print(f"{l} database created.")
print(f"{lang} database created.")

else:
print(f"Skipping {l} database creation as no JSON data files were found.")
print(f"Skipping {lang} database creation as no JSON data files were found.")
2 changes: 1 addition & 1 deletion src/scribe_data/load/send_dbs_to_scribe.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@
PATH_TO_SCRIBE_DATA_SRC = f"{PATH_TO_SCRIBE_ORG}Scribe-Data/src"
sys.path.insert(0, PATH_TO_SCRIBE_DATA_SRC)

from scribe_data.utils import (
from scribe_data.utils import ( # noqa: E402
get_ios_data_path,
get_language_from_iso,
get_path_from_load_dir,
Expand Down

0 comments on commit 6ab8d17

Please sign in to comment.