indietyp commited on
Commit
c7d6720
·
verified ·
1 Parent(s): 0991c68

fix pipeline tag

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. inference.py +5 -8
README.md CHANGED
@@ -9,7 +9,7 @@ tags:
9
  - url-slug
10
  - beam-search
11
  library_name: onnxruntime
12
- pipeline_tag: text2text-generation
13
  ---
14
 
15
  # vec2slug-v1-large
 
9
  - url-slug
10
  - beam-search
11
  library_name: onnxruntime
12
+ pipeline_tag: summarization
13
  ---
14
 
15
  # vec2slug-v1-large
inference.py CHANGED
@@ -269,9 +269,7 @@ class SlugPredictor(ABC):
269
  candidates.append((new_log_prob, new_tokens))
270
 
271
  # Rank by partial objective for consistent pruning
272
- candidates.sort(
273
- key=lambda x: self._partial_score(x[0], x[1]), reverse=True
274
- )
275
  active = candidates[:k]
276
 
277
  # Optimal stopping: best completed dominates all active upper bounds
@@ -304,8 +302,7 @@ class SlugPredictor(ABC):
304
 
305
  # Deduplicate and rank
306
  scored = [
307
- (self._score(log_prob, tokens), tokens)
308
- for log_prob, tokens in completed
309
  ]
310
  scored.sort(key=lambda x: -x[0])
311
 
@@ -400,9 +397,9 @@ def _load_pytorch_model(model_dir: Path, model_config: ModelConfig):
400
  self.token_embedding = nn.Embedding(vocab_size, embed_dim, padding_idx=0)
401
  self.position_embedding = nn.Embedding(max_length + 1, embed_dim)
402
  self.dropout = nn.Dropout(dropout)
403
- self.blocks = nn.ModuleList(
404
- [DecoderBlock(embed_dim, num_heads, dropout) for _ in range(num_layers)]
405
- )
406
  self.ln_final = nn.LayerNorm(embed_dim)
407
  self.output_projection = nn.Linear(embed_dim, vocab_size)
408
 
 
269
  candidates.append((new_log_prob, new_tokens))
270
 
271
  # Rank by partial objective for consistent pruning
272
+ candidates.sort(key=lambda x: self._partial_score(x[0], x[1]), reverse=True)
 
 
273
  active = candidates[:k]
274
 
275
  # Optimal stopping: best completed dominates all active upper bounds
 
302
 
303
  # Deduplicate and rank
304
  scored = [
305
+ (self._score(log_prob, tokens), tokens) for log_prob, tokens in completed
 
306
  ]
307
  scored.sort(key=lambda x: -x[0])
308
 
 
397
  self.token_embedding = nn.Embedding(vocab_size, embed_dim, padding_idx=0)
398
  self.position_embedding = nn.Embedding(max_length + 1, embed_dim)
399
  self.dropout = nn.Dropout(dropout)
400
+ self.blocks = nn.ModuleList([
401
+ DecoderBlock(embed_dim, num_heads, dropout) for _ in range(num_layers)
402
+ ])
403
  self.ln_final = nn.LayerNorm(embed_dim)
404
  self.output_projection = nn.Linear(embed_dim, vocab_size)
405