"A model that generates new content — text, image, audio, video, code, 3D". Modern examples: Claude, GPT, Gemini, Llama (text), Midjourney/DALL-E/SD (image), Suno (audio), Sora/Veo (video). Transformer and diffusion architectures are dominant.
from anthropic import Anthropic

# Text generation: create an API client and send one user message.
# The response object is kept in `r` for the caller to inspect.
client = Anthropic()
r = client.messages.create(
    model='claude-opus-4-7',
    max_tokens=1024,
    messages=[{'role': 'user', 'content': 'Write a haiku about AI'}],
)
Image (Stable Diffusion)
import torch
from diffusers import StableDiffusionXLPipeline

# Image generation: load the SDXL-Turbo checkpoint with float16 weights and
# move the pipeline to the CUDA device.
pipe = StableDiffusionXLPipeline.from_pretrained(
    'stabilityai/sdxl-turbo',
    torch_dtype=torch.float16,
).to('cuda')

# Run the prompt with 4 inference steps and keep the first returned image.
# NOTE(review): the SDXL-Turbo model card recommends guidance_scale=0.0 —
# confirm whether it should be passed here.
img = pipe('a sunset over mountains', num_inference_steps=4).images[0]
# image → 3D model
# NOTE(review): `tripo_client` is not created in this snippet — it must be
# constructed elsewhere before these lines run.
mesh = tripo_client.image_to_mesh('input.png')
mesh.save('output.glb')
Multimodal (Claude vision)
# Vision request: a single user turn whose content is a base64-encoded JPEG
# block followed by a text instruction. The return value is not captured.
client.messages.create(
    model='claude-opus-4-7',
    max_tokens=1024,
    messages=[
        {
            'role': 'user',
            'content': [
                {
                    'type': 'image',
                    'source': {
                        'type': 'base64',
                        'media_type': 'image/jpeg',
                        'data': img_b64,
                    },
                },
                {'type': 'text', 'text': 'Describe this image'},
            ],
        },
    ],
)
Agent (multi-step)
def agent_loop(goal, tools, max_steps=10):
    """Call the model repeatedly until it ends its turn or steps run out.

    Args:
        goal: Text used as the first user message of the conversation.
        tools: Tool definitions forwarded unchanged to ``messages.create``.
        max_steps: Upper bound on the number of model calls.

    Returns:
        The first response whose ``stop_reason`` is ``'end_turn'``, or
        ``None`` when ``max_steps`` calls complete without one.
    """
    history = [{'role': 'user', 'content': goal}]
    for _ in range(max_steps):
        r = client.messages.create(
            model='claude-opus-4-7',
            # Passed explicitly, matching the other messages.create calls here.
            max_tokens=1024,
            tools=tools,
            messages=history,
        )
        if r.stop_reason == 'end_turn':
            return r
        # TODO: execute the requested tool and append its result to `history`.
        # Until that is implemented, every iteration resends the same
        # conversation.
    return None
def well_formed_prompt(task, context, examples=None, format='json'):
    """Assemble a four-section prompt: context, examples, task, output format.

    Args:
        task: Text placed under the ``## Task`` heading.
        context: Text placed under the ``## Context`` heading.
        examples: Examples passed to ``format_examples``; defaults to an
            empty list created per call rather than a shared mutable default.
        format: Text placed under the ``## Output format`` heading.

    Returns:
        The prompt string, with each heading on its own line and a blank
        line between sections.
    """
    if examples is None:
        examples = []
    # Each section ends with a blank line so the next "##" heading starts on
    # its own line instead of being glued to the preceding value.
    return f"""## Context
{context}

## Examples
{format_examples(examples)}

## Task
{task}

## Output format
{format}"""
RAG-augmented gen
def rag_generate(question, retriever, llm, *, k=5):
    """Answer a question from retrieved documents.

    Args:
        question: The question, used both for retrieval and in the prompt.
        retriever: Object exposing ``retrieve(question, k=...)`` that returns
            an iterable of items with a ``text`` attribute.
        llm: Object exposing ``generate(prompt)``.
        k: Number of documents requested from the retriever (default 5).

    Returns:
        Whatever ``llm.generate`` returns for the assembled prompt.
    """
    docs = retriever.retrieve(question, k=k)
    # One retrieved text per line forms the context section of the prompt.
    context = '\n'.join(d.text for d in docs)
    return llm.generate(
        f"Context:\n{context}\n\nQuestion: {question}\nAnswer with citations:"
    )
Fine-tune (LoRA)
from peft import LoraConfig, get_peft_model

# LoRA fine-tuning setup: adapter config targeting the 'q_proj' and 'v_proj'
# modules, with r=16 and lora_alpha=32.
config = LoraConfig(r=16, lora_alpha=32, target_modules=['q_proj', 'v_proj'])

# NOTE(review): `base_model` is not defined in this snippet — it must be
# loaded elsewhere before this line runs.
model = get_peft_model(base_model, config)
# train on task data