|
""" |
|
Here, what should you do here? |
|
just upload all idioms here - name it as epie. |
|
""" |
|
import os |
|
from idiomify.paths import ROOT_DIR |
|
from idiomify.fetchers import fetch_pie |
|
import argparse |
|
import wandb |
|
|
|
|
|
def main(): |
|
parser = argparse.ArgumentParser() |
|
parser.add_argument("--ver", type=str, default="pie_v0", |
|
choices=["pie_v0", "pie_v1"]) |
|
config = vars(parser.parse_args()) |
|
|
|
|
|
if config['ver'] == "pie_v0": |
|
|
|
idioms = set([row[0] for row in fetch_pie()[:106]]) |
|
elif config['ver'] == "pie_v1": |
|
|
|
idioms = set([row[0] for row in fetch_pie()]) |
|
else: |
|
raise NotImplementedError |
|
idioms = list(idioms) |
|
|
|
with wandb.init(entity="eubinecto", project="idiomify", config=config) as run: |
|
artifact = wandb.Artifact(name="idioms", type="dataset") |
|
txt_path = ROOT_DIR / "all.txt" |
|
with open(txt_path, 'w') as fh: |
|
for idiom in idioms: |
|
fh.write(idiom + "\n") |
|
artifact.add_file(txt_path) |
|
run.log_artifact(artifact, aliases=["latest", config['ver']]) |
|
os.remove(txt_path) |
|
|
|
|
|
if __name__ == '__main__': |
|
main() |
|
|