fix includes with help from include-what-you-use

This commit is contained in:
cebtenzzre 2023-11-01 13:09:21 -04:00
parent 2b5136e1c2
commit 635e9fadfd
57 changed files with 311 additions and 235 deletions

View file

@ -1,20 +1,28 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "log.h"
#include "sampling.h"
#include <algorithm>
#include <cassert>
#include <cctype>
#include <chrono>
#include <cinttypes>
#include <cmath>
#include <cstring>
#include <cstdlib>
#include <ctime>
#include <exception>
#include <fstream>
#include <iterator>
#include <iostream>
#include <regex>
#include <sstream>
#include <stdexcept>
#include <string>
#include <thread>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <vector>
#include <cinttypes>
#if defined(__APPLE__) && defined(__MACH__)
#include <sys/types.h>
@ -32,9 +40,7 @@
#include <fcntl.h>
#include <io.h>
#else
#include <sys/ioctl.h>
#include <sys/stat.h>
#include <unistd.h>
#endif
#if defined(_MSC_VER)

View file

@ -3,19 +3,18 @@
#pragma once
#include "llama.h"
#include "sampling.h"
#define LOG_NO_FILE_LINE_FUNCTION
#include "log.h"
#include <cmath>
#include <string>
#include <vector>
#include <cstdint>
#include <cstdio>
#include <random>
#include <thread>
#include <unordered_map>
#include <string>
#include <tuple>
#include <vector>
#ifdef _WIN32
#define DIRECTORY_SEPARATOR '\\'
@ -68,7 +67,7 @@ struct gpt_params {
int32_t yarn_orig_ctx = 0; // YaRN original context length
int8_t rope_scaling_type = LLAMA_ROPE_SCALING_UNSPECIFIED;
// // sampling parameters
// sampling parameters
struct llama_sampling_params sparams;
std::string model = "models/7B/ggml-model-f16.gguf"; // model path

View file

@ -14,14 +14,13 @@
#define ENABLE_VIRTUAL_TERMINAL_PROCESSING 0x0004
#endif
#else
#include <climits>
#include <clocale>
#include <cstdio>
#include <cwchar>
#include <sys/ioctl.h>
#include <unistd.h>
#include <wchar.h>
#include <stdio.h>
#include <stdlib.h>
#include <signal.h>
#include <termios.h>
#include <unistd.h>
#endif
#define ANSI_COLOR_RED "\x1b[31m"

View file

@ -1,6 +1,5 @@
#include "grammar-parser.h"
#include <cstdint>
#include <cwchar>
#include <string>
#include <utility>
#include <stdexcept>

View file

@ -10,11 +10,14 @@
// space ::= [ \t\n]*
#pragma once
#include "llama.h"
#include <vector>
#include <map>
#include <cstdint>
#include <cstdio>
#include <map>
#include <string>
#include <vector>
namespace grammar_parser {
struct parse_state {

View file

@ -1,5 +1,11 @@
#include "common.h"
#include "sampling.h"
#include <algorithm>
#include <cstdio>
#include <map>
#include <utility>
struct llama_sampling_context * llama_sampling_init(const struct llama_sampling_params & params) {
struct llama_sampling_context * result = new llama_sampling_context();

View file

@ -1,12 +1,12 @@
#pragma once
#include "grammar-parser.h"
#include "llama.h"
#include "grammar-parser.h"
#include <cstdint>
#include <string>
#include <vector>
#include <unordered_map>
#include <vector>
// sampling parameters
typedef struct llama_sampling_params {
@ -56,8 +56,6 @@ struct llama_sampling_context {
std::vector<llama_token_data> cur;
};
#include "common.h"
// Create a new sampling context instance.
struct llama_sampling_context * llama_sampling_init(const struct llama_sampling_params & params);

View file

@ -1,9 +1,19 @@
#include "train.h"
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "train.h"
#include <algorithm>
#include <cerrno>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <functional>
#include <locale>
#include <random>
#include <sstream>
#include <functional>
struct random_normal_distribution {
std::mt19937 gen;

View file

@ -2,13 +2,14 @@
#pragma once
#include <string>
#include <random>
#include <vector>
#include "ggml.h"
#include "llama.h"
#include <cstddef>
#include <cstdint>
#include <random>
#include <string>
#include <vector>
typedef std::string mt19937_state;
struct train_state {

View file

@ -1,11 +1,13 @@
#include "ggml.h"
#include "train.h"
#include <vector>
#include <algorithm>
#include <cassert>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <random>
#include <vector>
#if defined(_MSC_VER)

View file

@ -1,10 +1,11 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include <algorithm>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <string>
#include <cstdlib>
#include <vector>
// mutates the input string

View file

@ -1,9 +1,11 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include <algorithm>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <string>
#include <vector>

View file

@ -1,29 +1,14 @@
#include "common.h"
#include "llama.h"
#include <algorithm>
#include <cassert>
#include <cinttypes>
#include <cmath>
#include <cstdio>
#include <cstring>
#include <ctime>
#include <fstream>
#include <iostream>
#include <string>
#include <tuple>
#include <vector>
#if defined (__unix__) || (defined (__APPLE__) && defined (__MACH__))
#include <signal.h>
#include <unistd.h>
#elif defined (_WIN32)
#define WIN32_LEAN_AND_MEAN
#ifndef NOMINMAX
# define NOMINMAX
#endif
#include <windows.h>
#include <signal.h>
#endif
// Used for debugging to print out beam tokens.
struct ostream_beam_view {
llama_context * ctx;

View file

@ -1,20 +1,11 @@
#include "common.h"
#include "ggml.h"
#include <locale.h>
#include <assert.h>
#include <math.h>
#include <cstring>
#include <cstdio>
#include <cinttypes>
#include <unordered_map>
#include <queue>
#include <string.h>
#include <cassert>
#include <fstream>
#include <cstdio>
#include <cstdlib>
#include <string>
#include <iterator>
#include <algorithm>
#include <vector>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -1,19 +1,22 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "common.h"
#include <unordered_map>
#include <vector>
#include <cassert>
#include <climits>
#include <cstring>
#include <cstdarg>
#include <ctime>
#include <random>
#include <stdexcept>
#include <sstream>
#include <algorithm>
#include <cassert>
#include <cerrno>
#include <climits>
#include <cmath>
#include <cstdarg>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <sstream>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>
// GGUF keys & tensor names.

View file

@ -1,7 +1,12 @@
#include "common.h"
#include "llama.h"
#include <algorithm>
#include <cstdio>
#include <ctime>
#include <random>
#include <tuple>
#include <vector>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -1,11 +1,16 @@
#include "common.h"
#include "ggml.h"
#include "ggml-alloc.h"
#include <vector>
#include <algorithm>
#include <cerrno>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <string>
#include <thread>
#include <vector>
static const size_t tensor_alignment = 32;

View file

@ -1,19 +1,19 @@
#include "ggml.h"
#include "ggml-alloc.h"
#include "llama.h"
#include "common.h"
#include "ggml-alloc.h"
#include "ggml.h"
#include "llama.h"
#include "train.h"
#include <unordered_map>
#include <vector>
#include <cassert>
#include <climits>
#include <cstring>
#include <cstdarg>
#include <ctime>
#include <random>
#include <stdexcept>
#include <algorithm>
#include <cerrno>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <ctime>
#include <string>
#include <vector>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -1,19 +1,17 @@
#include "common.h"
#include "console.h"
#include "llama.h"
#include "grammar-parser.h"
#include "sampling.h"
#include <cassert>
#include <cinttypes>
#include <cmath>
#include <algorithm>
#include <cstdio>
#include <cstring>
#include <cstdlib>
#include <ctime>
#include <fstream>
#include <iostream>
#include <random>
#include <sstream>
#include <string>
#include <tuple>
#include <vector>
#if defined (__unix__) || (defined (__APPLE__) && defined (__MACH__))

View file

@ -1,26 +1,30 @@
#include "ggml.h"
#include "llama.h"
#include "common.h"
#include "ggml-cuda.h"
#include <algorithm>
#include <array>
#include <cassert>
#include <cctype>
#include <chrono>
#include <cinttypes>
#include <clocale>
#include <cmath>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <ctime>
#include <iterator>
#include <map>
#include <memory>
#include <numeric>
#include <regex>
#include <sstream>
#include <string>
#include <utility>
#include <vector>
#include "ggml.h"
#include "llama.h"
#include "common.h"
#include "ggml-cuda.h"
// utils
static uint64_t get_time_ns() {
using clock = std::chrono::high_resolution_clock;

View file

@ -2,21 +2,23 @@
// so there might be still unnecessary artifacts hanging around
// I'll gradually clean and extend it
#include <cassert>
#include "clip.h"
#include "ggml-alloc.h"
#include "ggml.h"
#include <algorithm>
#include <climits>
#include <cmath>
#include <cstdarg>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <fstream>
#include <iostream>
#include <map>
#include <regex>
#include <stdexcept>
#include <string>
#include <vector>
#include "clip.h"
#include "ggml.h"
#include "ggml-alloc.h"
#define STB_IMAGE_IMPLEMENTATION
#include "stb_image.h"

View file

@ -1,7 +1,8 @@
#ifndef CLIP_H
#define CLIP_H
#include "ggml.h"
#include <stddef.h>
#include <stdint.h>
struct clip_ctx;

View file

@ -1,11 +1,14 @@
#include "clip.h"
#include "llava-utils.h"
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "llava-utils.h"
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <vector>
#include <cstring>
#include <string>
static void show_additional_info(int /*argc*/, char ** argv) {
printf("\n example usage: %s -m <llava-v1.5-7b/ggml-model-q5_k.gguf> --mmproj <llava-v1.5-7b/mmproj-model-f16.gguf> --image <path/to/an/image.jpg> [--temp 0.1] [-p \"describe the image in detail.\"]\n", argv[0]);

View file

@ -1,18 +1,17 @@
#include "common.h"
#include "console.h"
#include "llama.h"
#include "sampling.h"
#include <cassert>
#include <cinttypes>
#include <cmath>
#include <algorithm>
#include <cstdio>
#include <cstring>
#include <cstdlib>
#include <ctime>
#include <fstream>
#include <iostream>
#include <random>
#include <sstream>
#include <string>
#include <tuple>
#include <vector>
#if defined (__unix__) || (defined (__APPLE__) && defined (__MACH__))

View file

@ -2,13 +2,20 @@
// The clients submit requests to the server and they are processed in parallel.
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "sampling.h"
#include <cmath>
#include <algorithm>
#include <cctype>
#include <cstdint>
#include <cstdio>
#include <string>
#include <vector>
#include <cstdlib>
#include <ctime>
#include <istream>
#include <string>
#include <tuple>
#include <vector>
// trim whitespace from the beginning and end of a string
static std::string trim(const std::string & str) {

View file

@ -1,13 +1,20 @@
#include "common.h"
#include "llama.h"
#include <algorithm>
#include <chrono>
#include <cmath>
#include <cstdio>
#include <cstring>
#include <ctime>
#include <sstream>
#include <thread>
#include <iterator>
#include <mutex>
#include <random>
#include <sstream>
#include <string>
#include <thread>
#include <tuple>
#include <utility>
#include <vector>
#if defined(_MSC_VER)

View file

@ -8,15 +8,16 @@
#include <cinttypes>
#include <cmath>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <map>
#include <iterator>
#include <mutex>
#include <numeric>
#include <regex>
#include <string>
#include <unordered_map>
#include <vector>
#include <thread>
#include <mutex>
#include <utility>
#include <vector>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -1,10 +1,14 @@
#include "common.h"
#include "llama.h"
#include <cctype>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <vector>
#include <exception>
#include <string>
#include <vector>
struct quant_option {
std::string name;

View file

@ -1,9 +1,11 @@
#include "common.h"
#include "llama.h"
#include <vector>
#include <cstdint>
#include <cstdio>
#include <chrono>
#include <string>
#include <tuple>
#include <vector>
int main(int argc, char ** argv) {
gpt_params params;

View file

@ -1,6 +1,7 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "grammar-parser.h"
#include "sampling.h"
#include "../llava/clip.h"
@ -20,10 +21,28 @@
#include "completion.js.hpp"
#include "json-schema-to-grammar.mjs.hpp"
#include <cstddef>
#include <thread>
#include <mutex>
#include <algorithm>
#include <cctype>
#include <chrono>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <ctime>
#include <exception>
#include <functional>
#include <istream>
#include <iterator>
#include <mutex>
#include <numeric>
#include <stdexcept>
#include <string>
#include <thread>
#include <tuple>
#include <unordered_map>
#include <utility>
#include <vector>
#ifndef SERVER_VERBOSE
#define SERVER_VERBOSE 1

View file

@ -1,9 +1,8 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include <cmath>
#include <cstdio>
#include <string>
#include <vector>
int main(int argc, char ** argv) {

View file

@ -1,9 +1,13 @@
#include "common.h"
#include "ggml.h"
#include "llama.h"
#include "sampling.h"
#include <cmath>
#include <algorithm>
#include <cstdio>
#include <cstring>
#include <string>
#include <tuple>
#include <vector>
#define SPEC_VOCAB_MAX_SIZE_DIFFERENCE 100

View file

@ -1,19 +1,18 @@
#include "ggml.h"
#include "ggml-alloc.h"
#include "common.h"
#include "train.h"
#include "ggml-alloc.h"
#include "ggml.h"
#include "llama.h"
#include <unordered_map>
#include <vector>
#include <cassert>
#include <climits>
#include <cstring>
#include <cstdarg>
#include <ctime>
#include <random>
#include <stdexcept>
#include "train.h"
#include <algorithm>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <ctime>
#include <string>
#include <vector>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -1,8 +1,9 @@
#include "ggml-alloc.h"
#include "ggml-backend.h"
#include "ggml.h"
#include <assert.h>
#include <stdarg.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

View file

@ -2,6 +2,9 @@
#include "ggml.h"
#include <stdbool.h>
#include <stddef.h>
#ifdef __cplusplus
extern "C" {
#endif

View file

@ -1,8 +1,5 @@
#include "ggml-backend.h"
#include "ggml-alloc.h"
#include <assert.h>
#include <stdarg.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

View file

@ -2,6 +2,9 @@
#include "ggml.h"
#include <stdbool.h>
#include <stddef.h>
#ifdef __cplusplus
extern "C" {
#endif

View file

@ -1,9 +1,9 @@
#pragma once
#include "ggml.h"
// GGML internal header
#include "ggml.h"
#include <assert.h>
#include <stddef.h>
#include <stdbool.h>

View file

@ -1,10 +1,11 @@
#include "ggml-quants.h"
#include "ggml-impl.h"
#include <math.h>
#include <string.h>
#include <assert.h>
#include <float.h>
#include <math.h>
#include <stdbool.h>
#include <string.h>
#ifdef __ARM_NEON

View file

@ -1,11 +1,11 @@
#pragma once
#include "ggml-impl.h"
// GGML internal header
#include "ggml.h"
#include <assert.h>
#include <stdint.h>
#include <stddef.h>
#define QK4_0 32
typedef struct {

10
ggml.c
View file

@ -1,6 +1,7 @@
#define _CRT_SECURE_NO_DEPRECATE // Disables ridiculous "unsafe" warnings on Windows
#define _USE_MATH_DEFINES // For M_PI on MSVC
#include "ggml.h"
#include "ggml-impl.h"
#include "ggml-quants.h"
@ -20,9 +21,7 @@
#include <inttypes.h>
#include <stdio.h>
#include <float.h>
#include <limits.h>
#include <stdarg.h>
#include <signal.h>
#ifdef GGML_USE_METAL
#include <unistd.h>
@ -85,15 +84,14 @@ static int sched_yield (void) {
return 0;
}
#else
#include <pthread.h>
#include <sched.h>
#include <stdatomic.h>
#include <sys/stat.h>
typedef void * thread_ret_t;
#include <sys/types.h>
#include <sys/stat.h>
#include <unistd.h>
#endif
#ifdef GGML_USE_CPU_HBM

1
ggml.h
View file

@ -300,7 +300,6 @@ extern "C" {
GGML_API void ggml_fp16_to_fp32_row(const ggml_fp16_t * x, float * y, int n);
GGML_API void ggml_fp32_to_fp16_row(const float * x, ggml_fp16_t * y, int n);
struct ggml_object;
struct ggml_context;
enum ggml_type {

View file

@ -52,29 +52,34 @@
#include <algorithm>
#include <array>
#include <cassert>
#include <cerrno>
#include <cinttypes>
#include <climits>
#include <cmath>
#include <cstdarg>
#include <cstddef>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <ctime>
#include <exception>
#include <forward_list>
#include <fstream>
#include <functional>
#include <initializer_list>
#include <iterator>
#include <limits>
#include <map>
#include <memory>
#include <mutex>
#include <numeric>
#include <queue>
#include <random>
#include <regex>
#include <set>
#include <sstream>
#include <stdexcept>
#include <thread>
#include <type_traits>
#include <unordered_map>
#if defined(_MSC_VER)

View file

@ -2,12 +2,14 @@
#define LLAMA_H
#include "ggml.h"
#ifdef GGML_USE_CUBLAS
#include "ggml-cuda.h"
#define LLAMA_MAX_DEVICES GGML_CUDA_MAX_DEVICES
#else
#define LLAMA_MAX_DEVICES 1
#endif // GGML_USE_CUBLAS
#include <stddef.h>
#include <stdint.h>
#include <stdio.h>
@ -759,8 +761,9 @@ extern "C" {
// Internal API to be implemented by llama.cpp and used by tests/benchmarks only
#ifdef LLAMA_API_INTERNAL
#include <vector>
#include <string>
#include <utility>
#include <vector>
struct ggml_tensor;

View file

@ -1,16 +1,13 @@
#include <cstdio>
#include <type_traits>
#include <vector>
#include <random>
#include <chrono>
#include <cstdlib>
#include <cmath>
#include <cassert>
#include <cstring>
#include <array>
#include <type_traits>
#include "ggml.h"
#include <ggml.h>
#include <algorithm>
#include <chrono>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <random>
#include <vector>
constexpr int kVecSize = 1 << 16;

View file

@ -1,14 +1,15 @@
#include <cstdio>
#include <vector>
#include <random>
#include <chrono>
#include <cstdlib>
#include <cmath>
#include <cassert>
#include <cstring>
#include <array>
#include "ggml.h"
#include <ggml.h>
#include <algorithm>
#include <cassert>
#include <chrono>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <random>
#include <utility>
#include <vector>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -1,10 +1,11 @@
#define _CRT_SECURE_NO_DEPRECATE // Disables ridiculous "unsafe" warnings on Windows
#include "ggml.h"
#include <cassert>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cassert>
#if defined(_MSC_VER)
#pragma warning(disable: 4244 4267) // possible loss of data

View file

@ -2,10 +2,16 @@
#undef NDEBUG
#endif
#include "llama.h"
#include "grammar-parser.h"
#include "llama.h"
#include <cassert>
#include <cstdint>
#include <cstdio>
#include <map>
#include <string>
#include <utility>
#include <vector>
int main()
{

View file

@ -6,6 +6,12 @@
#include "grammar-parser.h"
#include <cassert>
#include <cstdint>
#include <cstdio>
#include <map>
#include <string>
#include <utility>
#include <vector>
int main()
{

View file

@ -2,10 +2,9 @@
#include "ggml.h"
#undef NDEBUG
#include <assert.h>
#include <math.h>
#include <stdio.h>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <string>
#include <vector>

View file

@ -2,14 +2,12 @@
#include "ggml.h"
#undef NDEBUG
#include <algorithm>
#include <assert.h>
#include <cinttypes>
#include <cmath>
#include <cstdio>
#include <functional>
#include <inttypes.h>
#include <math.h>
#include <memory>
#include <stdio.h>
#include <string>
#include <vector>

View file

@ -1,9 +1,10 @@
#include "ggml.h"
#include <cassert>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cassert>
#include <vector>
#if defined(_MSC_VER)

View file

@ -1,15 +1,9 @@
#include "ggml.h"
#include "llama.h"
#ifdef NDEBUG
#undef NDEBUG
#endif
#include <cmath>
#include <numeric>
#include <cassert>
#include <cstdio>
#include <vector>
#include <algorithm>
static void dump(const llama_token_data_array * candidates) {
for (size_t i = 0; i < candidates->size; i++) {

View file

@ -1,12 +1,14 @@
#include "llama.h"
#include "common.h"
#include "console.h"
#include "llama.h"
#include <cstdio>
#include <string>
#include <map>
#include <vector>
#include <fstream>
#include <iterator>
#include <map>
#include <string>
#include <utility>
#include <vector>
// generate using test-tokenizer-0-falcon.py
static const std::map<std::string, std::vector<llama_token>> & k_tests() {

View file

@ -1,12 +1,14 @@
#include "llama.h"
#include "common.h"
#include "console.h"
#include "llama.h"
#include <cstdio>
#include <string>
#include <map>
#include <vector>
#include <fstream>
#include <iterator>
#include <map>
#include <string>
#include <utility>
#include <vector>
// generate using test-tokenizer-0-llama.py
static const std::map<std::string, std::vector<llama_token>> & k_tests() {

View file

@ -1,16 +1,14 @@
#include "llama.h"
#include "common.h"
#include "unicode.h"
#include "console.h"
#include "ggml.h"
#include "llama.h"
#include "unicode.h"
#include <cassert>
#include <cstdint>
#include <cstdio>
#include <cstring>
#include <stdexcept>
#include <string>
#include <codecvt>
#include <map>
#include <vector>
#include <locale>
int main(int argc, char **argv) {
if (argc < 2) {

View file

@ -1,16 +1,13 @@
#include "llama.h"
#include "common.h"
#include "unicode.h"
#include "console.h"
#include "ggml.h"
#include "llama.h"
#include "unicode.h"
#include <cassert>
#include <cstdint>
#include <cstdio>
#include <cstring>
#include <string>
#include <codecvt>
#include <map>
#include <vector>
#include <locale>
int main(int argc, char **argv) {
if (argc < 2) {