dwb2023 committed on
Commit
8dba9f0
·
verified ·
1 Parent(s): 06b7155

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -17,12 +17,12 @@ YT_LENGTH_LIMIT_S = 4800 # 1 hour limit
17
  device = 0 if torch.cuda.is_available() else "cpu"
18
  pipe = pipeline(task="automatic-speech-recognition", model=MODEL_NAME, chunk_length_s=30, device=device)
19
 
20
- JSON_DATASET_DIR = Path("youtube-transcripts")
21
  JSON_DATASET_DIR.mkdir(parents=True, exist_ok=True)
22
  JSON_DATASET_PATH = JSON_DATASET_DIR / f"transcriptions-{uuid4()}.json"
23
 
24
  scheduler = CommitScheduler(
25
- repo_id="your-dataset-repo",
26
  repo_type="dataset",
27
  folder_path=JSON_DATASET_DIR,
28
  path_in_repo="data",
 
17
  device = 0 if torch.cuda.is_available() else "cpu"
18
  pipe = pipeline(task="automatic-speech-recognition", model=MODEL_NAME, chunk_length_s=30, device=device)
19
 
20
+ JSON_DATASET_DIR = Path("json_dataset")
21
  JSON_DATASET_DIR.mkdir(parents=True, exist_ok=True)
22
  JSON_DATASET_PATH = JSON_DATASET_DIR / f"transcriptions-{uuid4()}.json"
23
 
24
  scheduler = CommitScheduler(
25
+ repo_id="transcript-dataset",
26
  repo_type="dataset",
27
  folder_path=JSON_DATASET_DIR,
28
  path_in_repo="data",