Name
rickiepark's repositories
wiki
GRPO_From_Scratch_Multi_GPU_DataParallel_Qwen_2_5_1_5B_Instruct.ipynb
GRPO_Qwen_0_5_Instruct.ipynb
byte_pair_encoding.ipynb
count_language_model.ipynb
document_classifier_with_LLMs_as_labelers.ipynb
emotion_GPT2_as_classifier.ipynb
emotion_GPT2_as_text_generator.ipynb
emotion_GPT2_as_text_generator_LoRA.ipynb
emotion_classifier_CNN.ipynb
emotion_classifier_LR.ipynb
instruct_GPT2.ipynb
news_RNN_language_model.ipynb
news_decoder_language_model.ipynb
sampling_method.ipynb
GRPO.py
README.md
embedding_vs_linear.py
quadratic_loss.py
spotify_gemini_playlist.py