Andrei abetlen

484 followers · 25 following

Patagona Technologies
Toronto, Canada
@abetlen

View GitHub Profile

Recently created

Least recently created

Recently updated

Least recently updated

abetlen / idefics2_to_gguf.py

Last active June 5, 2024 14:36

	import os
	import json
	import typing
	import pathlib
	import argparse

	import numpy as np
	import numpy.typing as npt
	import gguf
	from gguf import KEY_ATTENTION_HEAD_COUNT, KEY_ATTENTION_LAYERNORM_EPS, KEY_BLOCK_COUNT, KEY_EMBEDDING_LENGTH, KEY_FEED_FORWARD_LENGTH, GGUFWriter, TokenType, SpecialVocab

abetlen / create_paligemma_gguf.py

Created May 27, 2024 02:46

	import os
	import argparse
	import numpy as np
	import numpy.typing as npt
	import gguf
	from safetensors import safe_open

	import json
	import typing

abetlen / main.py

Last active April 6, 2024 19:42

	from llama_cpp import Llama
	from llama_cpp.llama_chat_format import Llava15ChatHandler
	# Chat handler for the LLaVA 1.5-style prompt format; it is pointed at the
	# separate mmproj GGUF file through ``clip_model_path``.
	chat_handler = Llava15ChatHandler(
	    clip_model_path="llava-1.6-mistral-7b-gguf/mmproj-model-f16.gguf",
	)
	# Load the quantized language model and attach the chat handler to it.
	llm = Llama(
	    model_path="llava-1.6-mistral-7b-gguf/llava-v1.6-mistral-7b.Q4_K_M.gguf",
	    chat_handler=chat_handler,
	    # n_ctx should be increased to accommodate the image embedding
	    n_ctx=2048,
	    # needed to make llava work
	    logits_all=True,
	    # NOTE(review): -1 presumably offloads every layer to the GPU — confirm
	    # against the llama-cpp-python documentation.
	    n_gpu_layers=-1,
	)