Install the library first: pip install ctransformers
from ctransformers import AutoModelForCausalLM

# Load the model identified by 'marella/gpt-2-ggml' via ctransformers.
model_id = 'marella/gpt-2-ggml'
llm = AutoModelForCausalLM.from_pretrained(model_id)

# Call the loaded model with a prompt and print whatever it returns.
prompt = 'AI is going to'
completion = llm(prompt)
print(completion)

For more details, see the ctransformers project: https://github.com/marella/ctransformers