tokenizer / Makefile
flopml's picture
tracking with lfs
120dee6
raw
history blame contribute delete
601 Bytes
# ---- Build configuration ---------------------------------------------------

# Executable produced by the build, and the C sources it is built from
# (every .c file directly under src/).
TARGET := bin/tokenizer
SRCS := $(wildcard src/*.c)

# C compiler driver used for both compiling and linking.
CC := gcc

# Compiler flags, one per line:
#   -O3            high optimisation level
#   -static        produce a statically linked executable
#   -march=native  generate code for the CPU of the build machine
#   -ffast-math    allow floating-point optimisations that relax strict IEEE rules
# Warning flags are currently disabled; the set that was switched off is:
#   -Wall -Wextra -Werror
CFLAGS := -O3
CFLAGS += -static
CFLAGS += -march=native
CFLAGS += -ffast-math

# Libraries passed on the link line (the C library).
CLIBS := -lc
# Build the tokenizer executable. This is the first rule shown in the file,
# so it is what a bare `make` builds.
all: $(TARGET)
# Delete build products: the executable itself and every regular file
# directly under bin/. The -f flag keeps rm quiet when a file is already gone.
clean:
	rm -f $(TARGET)
	rm -f bin/*
# Command-line flags for the sample run: two input paths under data/ and two
# output paths under bin/.
# NOTE(review): the vocab filename is spelled `tinstories` (no `y`), unlike the
# other three paths -- confirm it matches the file that exists on disk.
run_args := \
  --dataset_path data/dataset_tinystories-v2_100k-rows.txt \
  --vocab_path data/vocab_tinstories-v2_size-4096_wordlen-12.txt \
  --dataset_output_path bin/dataset_tinystories-v2_100k-rows.bin \
  --tokenizer_output_path bin/tokenizer_tinystories-v2_size-4096_wordlen-12.bin

# Build the executable if it is out of date, then launch it with the flags above.
run: all
	./$(TARGET) $(run_args)
# Compile and link every source file in a single compiler invocation.
#   $@  is the executable being produced, $^ the full list of sources.
#
# The output directory is created first so the build also succeeds in a tree
# where it does not exist yet (e.g. a fresh checkout).
#
# Libraries are listed AFTER the sources: the linker resolves symbols from
# left to right, so a library named before the code that uses it contributes
# nothing -- this matters in particular for static links.
$(TARGET): $(SRCS)
	@mkdir -p $(@D)
	$(CC) $(CFLAGS) -o $@ $^ $(CLIBS)
# These targets are commands, not files: declaring them phony makes them run
# even if a file with the same name happens to exist.
.PHONY: all
.PHONY: clean
.PHONY: run