Two files needed to make DeepSeek work properly with Codex CLI:
model = "deepseek-reasoner"
model_provider = "deepseek-reasoner"
approval_policy = "on-failure"

Note
(2025-01-08) Add feature for 🏷️Tag(Revision) Selection, contributed by @Bamboo-D.
(2024-12-17) Add feature for ⚡Quick Startup and ⏭️Fast Resume, enabling skipping of downloaded files, while removing the git clone dependency to accelerate file list retrieval.
Considering the lack of multi-threaded download support in the official huggingface-cli and the inadequate error handling in hf_transfer, this command-line tool leverages curl and aria2c for fast and robust downloading of models and datasets.
This is a comparison between whisper.cpp and faster-whisper. The faster-whisper README includes some benchmarks, but I wanted to test it myself. For whisper, I just ran it manually. For faster-whisper, I wrote this small script:
Latest Update: May 19th, 2024
This gist contains all the steps required to:
CUDA 11.8 and CUDA 12.1

Environment Modules is a package that provides for the dynamic modification of a user's environment via modulefiles. You can find more on it at https://modules.readthedocs.io/en/latest/
| # Taken from https://johanwind.github.io/2023/03/23/rwkv_details.html. | |
| # I've added additional comments and restructured it a tiny bit, which makes it clearer for me. | |
| import numpy as np | |
| from torch import load as torch_load # Only for loading the model weights | |
| from tokenizers import Tokenizer | |
| exp = np.exp | |
| layer_norm = lambda x, w, b : (x - np.mean(x)) / np.std(x) * w + b | |
| sigmoid = lambda x : 1/(1 + exp(-x)) |
| # This example uses M2M-100 models converted to the CTranslate2 format. | |
| # Download CTranslate2 models: | |
| # • M2M-100 418M-parameter model: https://bit.ly/33fM1AO | |
| # • M2M-100 1.2B-parameter model: https://bit.ly/3GYiaed | |
| import ctranslate2 | |
| import sentencepiece as spm | |
| # Based on https://gist.github.com/bastibe/c0950e463ffdfdfada7adf149ae77c6f | |
| # Changes: | |
| # * Instead of overriding cd, we detect directory change. This allows the script to work | |
| # for other means of cd, such as z. | |
| # * Update syntax to work with new versions of fish. | |
| # * Handle virtualenvs that are not located in the root of a git directory. | |
| function __auto_source_venv --on-variable PWD --description "Activate/Deactivate virtualenv on directory change" | |
| status --is-command-substitution; and return |
| import logging | |
| import socks # use pysocks | |
| import asyncio | |
| from datetime import datetime | |
| from itertools import cycle | |
| logging.basicConfig(level=logging.INFO) | |
| socks_router_loop = cycle(( # simple round-robin router to socks proxies | |
| ('127.2.0.0', 9050, None, None), # address, port, username, password | |
| # ('127.3.0.0', 9050, "proxy", "passwordpassword"), |
| # MIT License | |
| # | |
| # Copyright (c) 2019 Cristian Adam | |
| # | |
| # Permission is hereby granted, free of charge, to any person obtaining a copy | |
| # of this software and associated documentation files (the "Software"), to deal | |
| # in the Software without restriction, including without limitation the rights | |
| # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | |
| # copies of the Software, and to permit persons to whom the Software is | |
| # furnished to do so, subject to the following conditions: |
| import asyncio | |
| import logging | |
| import re | |
| from asyncio import StreamReader, StreamWriter, StreamReaderProtocol | |
| from collections import namedtuple | |
| from typing import Optional | |
| import socks # use pysocks | |
| logging.basicConfig(level=logging.INFO) |