fix pipeline tag
Browse files- README.md +1 -1
- inference.py +5 -8
README.md
CHANGED
|
@@ -9,7 +9,7 @@ tags:
|
|
| 9 |
- url-slug
|
| 10 |
- beam-search
|
| 11 |
library_name: onnxruntime
|
| 12 |
-
pipeline_tag:
|
| 13 |
---
|
| 14 |
|
| 15 |
# vec2slug-v1-large
|
|
|
|
| 9 |
- url-slug
|
| 10 |
- beam-search
|
| 11 |
library_name: onnxruntime
|
| 12 |
+
pipeline_tag: summarization
|
| 13 |
---
|
| 14 |
|
| 15 |
# vec2slug-v1-large
|
inference.py
CHANGED
|
@@ -269,9 +269,7 @@ class SlugPredictor(ABC):
|
|
| 269 |
candidates.append((new_log_prob, new_tokens))
|
| 270 |
|
| 271 |
# Rank by partial objective for consistent pruning
|
| 272 |
-
candidates.sort(
|
| 273 |
-
key=lambda x: self._partial_score(x[0], x[1]), reverse=True
|
| 274 |
-
)
|
| 275 |
active = candidates[:k]
|
| 276 |
|
| 277 |
# Optimal stopping: best completed dominates all active upper bounds
|
|
@@ -304,8 +302,7 @@ class SlugPredictor(ABC):
|
|
| 304 |
|
| 305 |
# Deduplicate and rank
|
| 306 |
scored = [
|
| 307 |
-
(self._score(log_prob, tokens), tokens)
|
| 308 |
-
for log_prob, tokens in completed
|
| 309 |
]
|
| 310 |
scored.sort(key=lambda x: -x[0])
|
| 311 |
|
|
@@ -400,9 +397,9 @@ def _load_pytorch_model(model_dir: Path, model_config: ModelConfig):
|
|
| 400 |
self.token_embedding = nn.Embedding(vocab_size, embed_dim, padding_idx=0)
|
| 401 |
self.position_embedding = nn.Embedding(max_length + 1, embed_dim)
|
| 402 |
self.dropout = nn.Dropout(dropout)
|
| 403 |
-
self.blocks = nn.ModuleList(
|
| 404 |
-
|
| 405 |
-
)
|
| 406 |
self.ln_final = nn.LayerNorm(embed_dim)
|
| 407 |
self.output_projection = nn.Linear(embed_dim, vocab_size)
|
| 408 |
|
|
|
|
| 269 |
candidates.append((new_log_prob, new_tokens))
|
| 270 |
|
| 271 |
# Rank by partial objective for consistent pruning
|
| 272 |
+
candidates.sort(key=lambda x: self._partial_score(x[0], x[1]), reverse=True)
|
|
|
|
|
|
|
| 273 |
active = candidates[:k]
|
| 274 |
|
| 275 |
# Optimal stopping: best completed dominates all active upper bounds
|
|
|
|
| 302 |
|
| 303 |
# Deduplicate and rank
|
| 304 |
scored = [
|
| 305 |
+
(self._score(log_prob, tokens), tokens) for log_prob, tokens in completed
|
|
|
|
| 306 |
]
|
| 307 |
scored.sort(key=lambda x: -x[0])
|
| 308 |
|
|
|
|
| 397 |
self.token_embedding = nn.Embedding(vocab_size, embed_dim, padding_idx=0)
|
| 398 |
self.position_embedding = nn.Embedding(max_length + 1, embed_dim)
|
| 399 |
self.dropout = nn.Dropout(dropout)
|
| 400 |
+
self.blocks = nn.ModuleList([
|
| 401 |
+
DecoderBlock(embed_dim, num_heads, dropout) for _ in range(num_layers)
|
| 402 |
+
])
|
| 403 |
self.ln_final = nn.LayerNorm(embed_dim)
|
| 404 |
self.output_projection = nn.Linear(embed_dim, vocab_size)
|
| 405 |
|