Update README.md
Browse files
README.md
CHANGED
|
@@ -123,9 +123,10 @@ from transformers import pipeline
|
|
| 123 |
|
| 124 |
classifier = pipeline("text-classification", model="DiligentAI/urlbert-url-classifier")
|
| 125 |
result = classifier("https://store.myshopify.com")
|
| 126 |
-
|
| 127 |
-
|
| 128 |
Pydantic Integration (Production-Ready)
|
|
|
|
| 129 |
from transformers import pipeline
|
| 130 |
from pydantic import BaseModel, Field
|
| 131 |
from typing import Literal
|
|
@@ -146,7 +147,6 @@ def classify_url(url: str) -> URLClassificationResult:
|
|
| 146 |
label=label_map[result["label"]],
|
| 147 |
confidence=result["score"]
|
| 148 |
)
|
| 149 |
-
```
|
| 150 |
|
| 151 |
Limitations and Bias
|
| 152 |
Max URL Length: Model trained on 64-token sequences. Longer URLs are truncated.
|
|
@@ -171,6 +171,7 @@ Language detection
|
|
| 171 |
Spam filtering
|
| 172 |
Model Card Authors
|
| 173 |
DiligentAI Team
|
|
|
|
| 174 |
Citation
|
| 175 |
@misc{urlbert-classifier-2025,
|
| 176 |
author = {DiligentAI},
|
|
@@ -198,6 +199,7 @@ Model checkpoint (.safetensors)
|
|
| 198 |
Tokenizer configuration
|
| 199 |
Label mapping (label_map.json)
|
| 200 |
Performance metrics (metrics.json)
|
|
|
|
| 201 |
Contact
|
| 202 |
For issues, questions, or feedback:
|
| 203 |
GitHub: DiligentAI/url-classifier
|
|
|
|
| 123 |
|
| 124 |
classifier = pipeline("text-classification", model="DiligentAI/urlbert-url-classifier")
|
| 125 |
result = classifier("https://store.myshopify.com")
|
| 126 |
+
|
| 127 |
+
|
| 128 |
Pydantic Integration (Production-Ready)
|
| 129 |
+
|
| 130 |
from transformers import pipeline
|
| 131 |
from pydantic import BaseModel, Field
|
| 132 |
from typing import Literal
|
|
|
|
| 147 |
label=label_map[result["label"]],
|
| 148 |
confidence=result["score"]
|
| 149 |
)
|
|
|
|
| 150 |
|
| 151 |
Limitations and Bias
|
| 152 |
Max URL Length: Model trained on 64-token sequences. Longer URLs are truncated.
|
|
|
|
| 171 |
Spam filtering
|
| 172 |
Model Card Authors
|
| 173 |
DiligentAI Team
|
| 174 |
+
|
| 175 |
Citation
|
| 176 |
@misc{urlbert-classifier-2025,
|
| 177 |
author = {DiligentAI},
|
|
|
|
| 199 |
Tokenizer configuration
|
| 200 |
Label mapping (label_map.json)
|
| 201 |
Performance metrics (metrics.json)
|
| 202 |
+
|
| 203 |
Contact
|
| 204 |
For issues, questions, or feedback:
|
| 205 |
GitHub: DiligentAI/url-classifier
|