import { ModelInfoResponse, QuantizationType } from '../types'

const getModelInfo = async (modelName: string): Promise<ModelInfoResponse> => {
  const token = process.env.REACT_APP_HUGGINGFACE_TOKEN
  if (!token) {
    throw new Error(
      'Hugging Face token not found. Please set REACT_APP_HUGGINGFACE_TOKEN in your .env file'
    )
  }
  const response = await fetch(
    `https://huggingface.co/api/models/${modelName}`,
    {
      method: 'GET',
      headers: {
        Authorization: `Bearer ${token}`
      }
    }
  )
  if (!response.ok) {
    throw new Error(`Failed to fetch model info: ${response.statusText}`)
  }
  const modelData: ModelInfoResponse = await response.json()
  const requiredFiles = [
    'config.json',
    'tokenizer.json',
    'tokenizer_config.json',
  ]
  const siblingFiles = modelData.siblings?.map((s) => s.rfilename) || []
  const missingFiles = requiredFiles.filter(
    (file) => !siblingFiles.includes(file)
  )
  const hasOnnxWeights = siblingFiles.some(
    (file) => file.startsWith('onnx/') && file.endsWith('.onnx')
  )
  const isCompatible = missingFiles.length === 0 && hasOnnxWeights
  // Explain the failure: missing required files take precedence; otherwise
  // the model lacks ONNX weights under onnx/
  const incompatibilityReason = isCompatible
    ? ''
    : missingFiles.length > 0
      ? `Missing required files: ${missingFiles.join(', ')}`
      : 'No ONNX weight files found under onnx/'
  // Derive supported quantizations from ONNX filenames such as
  // 'onnx/model_q4.onnx': take the suffix after the last underscore of the
  // basename. The 'onnx/' guard skips top-level files like 'model.onnx'.
  const supportedQuantizations = siblingFiles
    .filter((file) => file.startsWith('onnx/') && file.endsWith('.onnx') && file.includes('_'))
    .map((file) => file.split('/').pop()!.replace(/\.onnx$/, '').split('_').pop()!)
    .filter((q) => q !== 'quantized') // 'model_quantized.onnx' carries no dtype suffix
  const uniqueSupportedQuantizations = Array.from(new Set(supportedQuantizations))
  // Sort by bit width, e.g. q4 < q8 < fp16 < fp32
  uniqueSupportedQuantizations.sort((a, b) => {
    const getNumericValue = (str: string) => {
      const match = str.match(/(\d+)/)
      return match ? parseInt(match[1], 10) : Infinity
    }
    return getNumericValue(a) - getNumericValue(b)
  })
  // When the repo lacks safetensors metadata (common for ONNX conversions),
  // fetch the declared base model (or the model's own id as a fallback) and
  // merge its info with the compatibility data computed above
  const baseModel = modelData.cardData?.base_model ?? modelData.modelId
  if (baseModel && !modelData.safetensors) {
    const baseModelResponse = await fetch(
      `https://huggingface.co/api/models/${baseModel}`,
      {
        method: 'GET',
        headers: {
          Authorization: `Bearer ${token}`
        }
      }
    )
    if (baseModelResponse.ok) {
      const baseModelData: ModelInfoResponse = await baseModelResponse.json()
      return {
        ...baseModelData,
        id: modelData.id,
        baseId: baseModel,
        isCompatible,
        incompatibilityReason,
        supportedQuantizations: uniqueSupportedQuantizations as QuantizationType[]
      }
    }
  }
  return {
    ...modelData,
    isCompatible,
    incompatibilityReason,
    supportedQuantizations: uniqueSupportedQuantizations as QuantizationType[]
  }
}
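
// Usage sketch (illustrative only; 'Xenova/distilbert-base-uncased' is just an
// example model id, not something this module depends on):
//
//   const info = await getModelInfo('Xenova/distilbert-base-uncased')
//   if (info.isCompatible) {
//     console.log(info.supportedQuantizations) // e.g. ['q4', 'q8', 'fp16']
//   } else {
//     console.warn(info.incompatibilityReason)
//   }
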
const getModelsByPipeline = async (
  pipeline_tag: string
): Promise<ModelInfoResponse[]> => {
  const token = process.env.REACT_APP_HUGGINGFACE_TOKEN
  if (!token) {
    throw new Error(
      'Hugging Face token not found. Please set REACT_APP_HUGGINGFACE_TOKEN in your .env file'
    )
  }
  const response = await fetch(
    `https://huggingface.co/api/models?filter=${pipeline_tag}&filter=transformers.js&sort=downloads`,
    {
      method: 'GET',
      headers: {
        Authorization: `Bearer ${token}`
      }
    }
  )
  if (!response.ok) {
    throw new Error(`Failed to fetch models for pipeline: ${response.statusText}`)
  }
  const models: ModelInfoResponse[] = await response.json()
  // Exclude rerankers, which also carry the text-classification tag
  if (pipeline_tag === 'text-classification') {
    return models
      .filter(
        (model) => !model.tags.includes('reranker') && !model.id.includes('reranker')
      )
      .slice(0, 10)
  }
  return models.slice(0, 10)
}
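
// Usage sketch (illustrative; 'feature-extraction' is just an example
// pipeline tag): returns the ten most-downloaded transformers.js models.
//
//   const models = await getModelsByPipeline('feature-extraction')
//   models.forEach((m) => console.log(m.id))
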
function getModelSize(
  parameters: number,
  quantization: QuantizationType
): number {
  let bytesPerParameter: number
  switch (quantization) {
    case 'fp32':
      // 32-bit floating point uses 4 bytes per parameter
      bytesPerParameter = 4
      break
    case 'fp16':
      // 16-bit floating point uses 2 bytes per parameter
      bytesPerParameter = 2
      break
    case 'int8':
    case 'bnb8':
    case 'uint8':
    case 'q8':
      // 8-bit quantizations use 1 byte per parameter
      bytesPerParameter = 1
      break
    case 'bnb4':
    case 'q4':
      // 4-bit quantizations pack two parameters per byte
      bytesPerParameter = 0.5
      break
  }
  const sizeInBytes = parameters * bytesPerParameter
  // There are 1,024 * 1,024 bytes in a megabyte
  const sizeInMB = sizeInBytes / (1024 * 1024)
  return sizeInMB
}
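
// Worked example (hypothetical numbers): a 100M-parameter model at 'q4'
// uses 100_000_000 * 0.5 = 50_000_000 bytes, i.e. about 47.68 MB:
//
//   getModelSize(100_000_000, 'q4') // ≈ 47.68
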
export { getModelInfo, getModelSize, getModelsByPipeline }