import tiktoken import hashlib from flask import jsonify, make_response _encoding = None def get_encoding(): global _encoding if _encoding is None: _encoding = tiktoken.get_encoding("cl100k_base") return _encoding def num_tokens_from_string(string: str) -> int: encoding = get_encoding() if isinstance(string, str): num_tokens = len(encoding.encode(string)) return num_tokens else: return 0 def num_tokens_from_object_or_list(thing): if isinstance(thing, list): return sum([num_tokens_from_object_or_list(x) for x in thing]) elif isinstance(thing, dict): return sum([num_tokens_from_object_or_list(x) for x in thing.values()]) elif isinstance(thing, str): return num_tokens_from_string(thing) else: return 0 def count_tokens_docs(docs): docs_content = "" for doc in docs: docs_content += doc.page_content tokens = num_tokens_from_string(docs_content) return tokens def check_required_fields(data, required_fields): missing_fields = [field for field in required_fields if field not in data] if missing_fields: return make_response( jsonify( { "success": False, "message": f"Missing fields: {', '.join(missing_fields)}", } ), 400, ) return None def get_hash(data): return hashlib.md5(data.encode()).hexdigest()