To offload a model to the GPU, the model must fit in VRAM.
The following table lists representative models for each VRAM size, assuming Q4_K_M quantization. You can always run a model listed under a smaller VRAM size.
| VRAM  | Models                  |
|-------|-------------------------|
| 384GB | DeepSeek V3 671b        |
| 128GB | Mistral Large 2411 123b |
| 64GB  | Qwen2.5 72b             |
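
As a rough back-of-the-envelope check, you can estimate the VRAM a quantized model needs from its parameter count and the quantization's average bits per weight. The sketch below is a simplified illustration, not an exact sizing tool: the ~4.85 bits/weight figure for Q4_K_M and the 10% runtime overhead factor are assumptions, and actual GGUF file sizes plus KV-cache usage vary with model architecture and context length.

```python
# Back-of-the-envelope VRAM estimate for a quantized model.
# Assumptions (not from this guide): Q4_K_M averages ~4.85 bits per
# weight, and ~10% extra is reserved for KV cache and compute buffers.

def estimate_vram_gb(params_billions: float,
                     bits_per_weight: float = 4.85,
                     overhead: float = 1.10) -> float:
    """Return an approximate VRAM requirement in GB."""
    weights_gb = params_billions * bits_per_weight / 8  # weight storage
    return weights_gb * overhead                        # runtime headroom


if __name__ == "__main__":
    for name, params in [("Qwen2.5 72b", 72),
                         ("Mistral Large 2411 123b", 123)]:
        print(f"{name}: ~{estimate_vram_gb(params):.0f} GB")
```

Under these assumptions, Qwen2.5 72b comes out to roughly 48GB and Mistral Large 2411 123b to roughly 82GB, consistent with the 64GB and 128GB tiers above.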