This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| MODEL_TO_USE = "NanoV2" # or "MistralNemo" | |
| IMPORT_MODEL_AND_DATA = False # set to True to import the model from the HF hub; this only needs to be run once | |
| REASONING_STYLE = "gpt_oss_120b" # or "DeepSeek_R1_0528" | |
| NUM_NODES = 2 | |
| GPUS_PER_NODE = 8 | |
| import nemo_run as run | |
| from nemo.collections import llm | |
| from nemo.collections.llm.gpt.model.mistral import MistralModel, MistralNeMoConfig12B | |
| from nemo.collections.llm.gpt.model.ssm import MambaModel, NemotronNano12Bv2 |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| #:package ARSoft.Tools.Net@3.6.1 | |
| #:package LLMTornado@3.7.25 | |
| using ARSoft.Tools.Net; | |
| using ARSoft.Tools.Net.Dns; | |
| using LlmTornado.Code; | |
| using LlmTornado; | |
| using LlmTornado.Chat; | |
| (string EnvKey, LLmProviders Provider)[] Providers = [ |