Qwen2-VL-inference/docs/restful.md at main · ZachcZhang/Qwen2-VL-inference

restful request

import requests
import sys
import json

def fetch_qwen2vl(user_info):
    endpoint = "http://127.0.0.1:10102/v1/chat/completions"
    headers = {
        'Content-Type': 'application/json',
    }
    payload = json.dumps({
        "model": "qwen2vl",
        "messages": [
            {
                "role": "user",
                "content": [
                    {
                        "type": "image",
                        "image": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-VL/assets/demo.jpeg",
                    },
                    {"type": "text", "text": "请详细描述这张图片."},
                ],
            }
        ],
        "stream":True,
        "max_tokens":512
        
    })
    response =  requests.post(endpoint, headers=headers, data=payload, stream=True)
    for chunk in response.iter_lines(): 
        if chunk:
            decoded_line = chunk.decode('utf-8')
            data = decoded_line[len("data: "):].strip()
            try:
                data = json.loads(data)
                choieces = data["choices"][0]
                if choieces["finish_reason"] is not None:
                    break
                sys.stdout.write(choieces["delta"]["content"])
                sys.stdout.flush()
                
            except Exception as e:
                pass

def main():
    question = """
    请描述图片
    """
    fetch_qwen2vl(question)
    
if __name__ == "__main__":
    main()

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

restful request

FilesExpand file tree

restful.md

Latest commit

History

restful.md

File metadata and controls

restful request