import torch from modelscope import AutoModelForCausalLM, AutoTokenizer from decoder import decode_vq_tokens model_path = "inclusionAI/LLaDA2.0-Uni" tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True) model = AutoModelForCausalLM.from_pretrained( model_path, device_map="auto", torch_dtype="bfloat16", trust_remote_code=True ).eval() model.tokenizer = tokenizer # Generate image tokens result = model.generate_image( "A modern Scandinavian kitchen with white cabinetry, marble countertops, and a single orchid on the island. A Nordic woman with sleek blonde ponytail, wearing an oversized sweater and dainty silver necklaces, stirs a matcha bowl with a bamboo whisk, eyes sparkling with quiet joy. Shot with 50mm, f/2.5, diffused window light, cool white balance, low saturation, clean skin retouch. Mood: serene, wholesome, hygge.", image_h=1024, image_w=1024, steps=8, cfg_scale=2.0, ) # Decode to PIL image (default: 50-step ODE) image = decode_vq_tokens(result["token_ids"], result["h"], result["w"], model_path, "cuda") image.save("output.png")