MCPcopy
hub / github.com/Lightricks/ComfyUI-LTXVideo / _enhance

Function _enhance

gemma_encoder.py:402–448  ·  view source on GitHub ↗

Common enhancement logic for both T2V and I2V modes.

(
    processor: Gemma3Processor,
    model: Gemma3ForConditionalGeneration,
    messages: list,
    image: Optional[Image.Image] = None,
    max_new_tokens: int = 512,
    seed: int = 42,
)

Source from the content-addressed store, hash-verified

400
401
402def _enhance(
403 processor: Gemma3Processor,
404 model: Gemma3ForConditionalGeneration,
405 messages: list,
406 image: Optional[Image.Image] = None,
407 max_new_tokens: int = 512,
408 seed: int = 42,
409) -> str:
410 """Common enhancement logic for both T2V and I2V modes."""
411 if processor is None:
412 raise ValueError("Processor not loaded - enhancement not available")
413
414 text = processor.tokenizer.apply_chat_template(
415 messages, tokenize=False, add_generation_prompt=True
416 )
417
418 model_inputs = processor(
419 text=text,
420 images=image,
421 return_tensors="pt",
422 ).to(model.device)
423
424 pad_token_id = (
425 processor.tokenizer.pad_token_id
426 if processor.tokenizer.pad_token_id is not None
427 else 0
428 )
429 model_inputs = _pad_inputs_for_attention_alignment(model_inputs, pad_token_id)
430
431 with (
432 torch.inference_mode(),
433 torch.random.fork_rng(devices=[model.device]),
434 torch.autocast(device_type=model.device.type, dtype=model.dtype),
435 ):
436 torch.manual_seed(seed)
437 outputs = model.generate(
438 **model_inputs,
439 max_new_tokens=max_new_tokens,
440 do_sample=True,
441 temperature=0.7,
442 )
443 generated_ids = outputs[0][len(model_inputs.input_ids[0]) :]
444 enhanced_prompt = processor.tokenizer.decode(
445 generated_ids, skip_special_tokens=True
446 )
447
448 return enhanced_prompt
449
450
451def enhance_t2v(

Callers 2

enhance_t2vFunction · 0.85
enhance_i2vFunction · 0.85

Calls 3

decodeMethod · 0.80
generateMethod · 0.45

Tested by

no test coverage detected