File size: 601 Bytes
120dee6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# C compiler used for the build.
CC := gcc

# Compiler flags: full optimisation, static linking, code generation for the
# build machine's CPU, and relaxed floating-point semantics.
# The warning set (-Wall -Wextra -Werror) is currently left disabled.
CFLAGS := \
    -O3 \
    -static \
    -march=native \
    -ffast-math

# Libraries passed on the compiler command line.
CLIBS := -lc

# Output binary, and the C sources it is built from (every .c file directly
# under src/, collected once when the Makefile is parsed).
TARGET := bin/tokenizer
SRCS := $(wildcard src/*.c)



# Default goal: build the tokenizer binary.
all: $(TARGET)

# Delete the built binary and every other file in bin/ (this includes the
# .bin outputs that `make run` writes there). Missing files are not an error.
clean:
	$(RM) $(TARGET) bin/*

# Input and output locations handed to the tokenizer by `make run`.
# NOTE(review): "tinstories" in the vocab path may be a typo for "tinystories";
# confirm against the actual file name under data/ before changing it.
run_dataset_path          := data/dataset_tinystories-v2_100k-rows.txt
run_vocab_path            := data/vocab_tinstories-v2_size-4096_wordlen-12.txt
run_dataset_output_path   := bin/dataset_tinystories-v2_100k-rows.bin
run_tokenizer_output_path := bin/tokenizer_tinystories-v2_size-4096_wordlen-12.bin

# Build the binary if necessary, then launch it with the paths defined above.
run: all
	./$(TARGET) \
		--dataset_path          $(run_dataset_path) \
		--vocab_path            $(run_vocab_path) \
		--dataset_output_path   $(run_dataset_output_path) \
		--tokenizer_output_path $(run_tokenizer_output_path)



# Compile and link all sources into the tokenizer binary in a single step.
#
# - The output directory is created first so the build also works when bin/
#   does not exist yet.
# - $(CLIBS) comes after the source files: the linker resolves libraries in
#   command-line order, so a library listed before the code that uses it
#   contributes nothing, which breaks static links in particular.
$(TARGET): $(SRCS)
	@mkdir -p $(@D)
	$(CC) $(CFLAGS) -o $@ $^ $(CLIBS)



# These goals are commands, not files; always run them even if a file with
# the same name exists.
.PHONY: all clean run