| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| |
|
|
# Heartbeat settings shared by the controller and worker processes.
# NOTE(review): units are not stated in this file — presumably seconds; confirm
# against the code that reads these values.
CONTROLLER_HEART_BEAT_EXPIRATION = 30
WORKER_HEART_BEAT_INTERVAL = 15

# NOTE(review): presumably the directory log files are written to; "." is the
# current working directory.
LOGDIR = "."

# ---------------------------------------------------------------------------
# Model constants
# ---------------------------------------------------------------------------

# NOTE(review): presumably the label value skipped by the loss; -100 is the
# default `ignore_index` of torch.nn.CrossEntropyLoss — confirm at call sites.
IGNORE_INDEX = -100

# Placeholder strings for each media type.
DEFAULT_IMAGE_TOKEN = "<image>"
DEFAULT_SOUND_TOKEN = "<sound>"
DEFAULT_SPEECH_TOKEN = "<speech>"

# Defined exactly once (the module previously assigned this same value twice).
SENTINEL_TOKEN = "<vila/sentinel>"

# NOTE(review): these are spelled without the pipes used by the tokenizer's
# "<|im_start|>" / "<|im_end|>" entries listed further down — confirm the
# difference is intentional.
DEFAULT_IM_START_TOKEN = "<im_start>"
DEFAULT_IM_END_TOKEN = "<im_end>"

# Media type -> placeholder token. Image, speech and sound reuse the DEFAULT_*
# constants above so the two spellings cannot drift apart; video has no
# DEFAULT_* counterpart in this module.
MEDIA_TOKENS = {
    "image": DEFAULT_IMAGE_TOKEN,
    "video": "<vila/video>",
    "speech": DEFAULT_SPEECH_TOKEN,
    "sound": DEFAULT_SOUND_TOKEN,
}

# Reference: added-token tables of the two tokenizer variants. Every entry is
# AddedToken(<token>, rstrip=False, lstrip=False, single_word=False,
#            normalized=False, special=True).
#
# vila:
#   151643  <|endoftext|>
#   151644  <|im_start|>
#   151645  <|im_end|>
#   151646  [BOS]
#   151647  [PAD]
#   151648  <vila/sentinel>
#   151649  <image>
#   151650  <vila/video>
#
# xvila: the same eight entries as vila (151643-151650), followed by:
#   151651  <speech>
#   151652  <sound>
#   151653  <|image_bos|>
#   151654  <|image_eos|>
#   151655  <|video_bos|>
#   151656  <|video_eos|>
#   151657  <|speech_bos|>
#   151658  <|speech_eos|>
#   151659  <|sound_bos|>
#   151660  <|sound_eos|>

# Media type -> [begin marker, end marker]. These are the eight *_bos / *_eos
# tokens that appear only in the xvila table above.
MM_BOS_EOS_TOKENS = {
    "image": ["<|image_bos|>", "<|image_eos|>"],
    "video": ["<|video_bos|>", "<|video_eos|>"],
    "speech": ["<|speech_bos|>", "<|speech_eos|>"],
    "sound": ["<|sound_bos|>", "<|sound_eos|>"],
}

# 8 equals the number of entries in the vila table (151643-151650); 10 equals
# the number of entries xvila lists beyond those (151651-151660).
# NOTE(review): how callers apply these counts is not visible in this file.
NUM_EXTRA_TOKENS_VILA = 8
NUM_EXTRA_TOKENS_XVILA = 10
|
|