File size: 1,418 Bytes
ad9a66f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
from flask import Flask, request, jsonify
from transformers import AutoTokenizer
import os

# Flask application object; the route decorators below register handlers on it.
app = Flask(__name__)

# Load the tokenizer from the directory that contains this file.
# The path is made absolute first: when the script is started via a relative
# path on interpreters where __file__ is relative, os.path.dirname(__file__)
# evaluates to '' which is not a usable directory path.
tokenizer = AutoTokenizer.from_pretrained(
    os.path.dirname(os.path.abspath(__file__))
)

def _build_prompt_text(messages, system=None):
    """Flatten an optional system prompt and chat messages into one string.

    Args:
        messages: Iterable of dicts; each may carry 'role' and 'content'
            (both default to '' when absent).
        system: Optional system prompt. Skipped when falsy.

    Returns:
        The concatenated text: an optional "System: ...\\n\\n" header followed
        by one "<Label>: <content>\\n" line per message, where the label is
        "User" / "Assistant" for those roles and the raw role otherwise.
    """
    parts = []
    if system:
        parts.append(f"System: {system}\n\n")

    for msg in messages:
        role = msg.get('role', '')
        content = msg.get('content', '')
        if role == 'user':
            label = 'User'
        elif role == 'assistant':
            label = 'Assistant'
        else:
            label = role
        # Non-string content is rendered through its str() form by the f-string.
        parts.append(f"{label}: {content}\n")

    # Join once instead of growing a string with += inside the loop.
    return "".join(parts)


@app.route('/count_tokens', methods=['POST'])
def count_tokens():
    """Count the tokens of a chat-style request body.

    Expects a JSON object with an optional 'messages' list (of objects with
    'role' and 'content') and an optional 'system' value.

    Returns:
        A JSON response {'input_tokens': <int>} on success, or
        ({'error': <str>}, 400) when the body is not a JSON object, when
        'messages' is not a list of objects, or when tokenization fails.
    """
    # silent=True yields None for a missing, non-JSON or malformed body, so all
    # of those cases are reported through the same explicit 400 below.
    data = request.get_json(silent=True)
    if not isinstance(data, dict):
        return jsonify({
            'error': 'Request body must be a JSON object'
        }), 400

    messages = data.get('messages', [])
    if not isinstance(messages, list) or not all(
        isinstance(msg, dict) for msg in messages
    ):
        return jsonify({
            'error': "'messages' must be a list of objects"
        }), 400

    # Build the full text to be tokenized.
    text = _build_prompt_text(messages, data.get('system'))

    # Count tokens. Any tokenizer failure is still reported as a 400 JSON
    # error, which keeps the endpoint's existing response contract.
    try:
        token_count = len(tokenizer.encode(text))
    except Exception as e:
        return jsonify({
            'error': str(e)
        }), 400

    return jsonify({
        'input_tokens': token_count
    })

@app.route('/health', methods=['GET'])
def health():
    """Health-check endpoint returning a fixed JSON payload.

    The 'tokenizer' entry is a hard-coded label; this handler does not
    inspect the tokenizer object itself.
    """
    payload = dict(status='healthy', tokenizer='deepseek-v3')
    return jsonify(payload)

if __name__ == '__main__':
    # Direct-execution entry point: serve on the loopback address, port 7861.
    app.run(
        port=7861,
        host='127.0.0.1',
    )