# ---------------------------------------------------------------------------
# Build configuration for the tokenizer executable.
# ---------------------------------------------------------------------------

# Compiler driver; used for compiling and linking in a single invocation.
CC := gcc

# Optimised, statically linked build.
#   -march=native  generates code for the CPU of the build machine, so the
#                  resulting binary may not run on a different CPU.
#   -ffast-math    allows floating-point optimisations that break strict
#                  IEEE/ISO semantics.
CFLAGS := -O3 -static -march=native -ffast-math

# Libraries passed to the linker.
CLIBS := -lc

# Path of the executable produced by the build.
TARGET := bin/tokenizer

# Every C file directly under src/ is part of the build. $(sort) keeps the
# order (and therefore the link command) deterministic on GNU Make versions
# whose $(wildcard) does not return sorted results.
SRCS := $(sort $(wildcard src/*.c))

# Build the tokenizer executable. As the first rule shown in this file it is
# what a bare `make` builds, unless an earlier rule or .DEFAULT_GOAL exists.
all: $(TARGET)

# Delete the executable and every file in bin/. The `run` target passes
# bin/ paths as its output arguments, so those files are removed as well.
clean:
	rm -f $(TARGET) bin/*

# Build the tokenizer if necessary, then run it with the TinyStories paths
# below. Going by the flag names, the data/ files are inputs and the bin/
# files are outputs.
# NOTE(review): the vocab file name is spelled "tinstories" (no "y"), unlike
# the other paths -- confirm it matches the file on disk before changing it.
run: all
	./$(TARGET) \
		--dataset_path data/dataset_tinystories-v2_100k-rows.txt \
		--vocab_path data/vocab_tinstories-v2_size-4096_wordlen-12.txt \
		--dataset_output_path bin/dataset_tinystories-v2_100k-rows.bin \
		--tokenizer_output_path bin/tokenizer_tinystories-v2_size-4096_wordlen-12.bin

# Compile and link all sources into the executable in one compiler call.
# Only the .c files are prerequisites, so a header change alone does not
# trigger a rebuild.
$(TARGET): $(SRCS)
	@mkdir -p $(@D)                      # output directory may not exist yet
	$(CC) $(CFLAGS) -o $@ $^ $(CLIBS)    # libraries after inputs: the linker
	                                     # resolves symbols left to right

# These targets are commands rather than files: always run them, even if a
# file with the same name exists in the working directory.
.PHONY: all run clean