clefourrier HF staff committed on
Commit
6eb8bfd
·
1 Parent(s): daf60ae

Update src/submission/check_validity.py

Browse files
Files changed (1) hide show
  1. src/submission/check_validity.py +6 -12
src/submission/check_validity.py CHANGED
@@ -31,26 +31,20 @@ def check_model_card(repo_id: str) -> tuple[bool, str]:
31
 
32
  return True, ""
33
 
34
-
35
  def is_model_on_hub(model_name: str, revision: str, token: str = None, trust_remote_code=False, test_tokenizer=False) -> tuple[bool, str]:
36
- """Makes sure the model is on the hub, and uses a valid configuration (in the latest transformers version)"""
37
  try:
38
  config = AutoConfig.from_pretrained(model_name, revision=revision, trust_remote_code=trust_remote_code, token=token)
39
  if test_tokenizer:
40
- tokenizer_config = get_tokenizer_config(model_name)
41
- if tokenizer_config is not None:
42
- tokenizer_class_candidate = tokenizer_config.get("tokenizer_class", None)
43
- else:
44
- tokenizer_class_candidate = config.tokenizer_class
45
-
46
-
47
- tokenizer_class = tokenizer_class_from_name(tokenizer_class_candidate)
48
- if tokenizer_class is None:
49
  return (
50
  False,
51
- f"uses {tokenizer_class_candidate}, which is not in a transformers release, therefore not supported at the moment.",
52
  None
53
  )
 
 
54
  return True, None, config
55
 
56
  except ValueError:
 
31
 
32
  return True, ""
33
 
 
34
  def is_model_on_hub(model_name: str, revision: str, token: str = None, trust_remote_code=False, test_tokenizer=False) -> tuple[bool, str]:
 
35
  try:
36
  config = AutoConfig.from_pretrained(model_name, revision=revision, trust_remote_code=trust_remote_code, token=token)
37
  if test_tokenizer:
38
+ try:
39
+ tk = AutoTokenizer.from_pretrained(model_name, revision=revision, trust_remote_code=trust_remote_code, token=token)
40
+ except ValueError as e:
 
 
 
 
 
 
41
  return (
42
  False,
43
+ f"uses a tokenizer which is not in a transformers release: {e}",
44
  None
45
  )
46
+ except Exception as e:
47
+ return (False, "'s tokenizer cannot be loaded. Is your tokenizer class in a stable transformers release, and correctly configured?", None)
48
  return True, None, config
49
 
50
  except ValueError: