examples/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
examples/fairseq/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
examples/fairseq/generate.py,sha256=4opRs__0loOZG6pjvMZvgvAKfRdgj5DjI8cdELqEBm4,236
examples/fairseq/interactive.py,sha256=caBEGlVlsCz_3XZkFnQByKSehuwe9n9uUdyjFscfNVY,239
examples/fairseq/train.py,sha256=0qNw_HMWZ7sTpM-faheyk6OMuTjZsNtyFGpyTAt4Ohw,233
examples/fairseq/criterions/__init__.py,sha256=nU5g8ylzv6OrfQ2ekxO_RDRwmhosPRvqiRrkMRwy0PA,317
examples/fairseq/criterions/masked_lm_moe.py,sha256=7TmKjKfEHGPXpaLkEmZG7fNGtZhK9uzsxmVWgSSlqhQ,2698
examples/fairseq/models/__init__.py,sha256=-puLbQR-evoEuFGAZCS_1IBt6VL7MTLszVzX9U0Y6Oc,1312
examples/fairseq/models/bert.py,sha256=zOA_K0uZcNTtSfplFd18jdCJNJhvhvWUse0MBUSWSFQ,18556
examples/fairseq/models/language_modeling.py,sha256=1sp2h8_hADrXJadSV_Q6_jUb2htHjgEEREYRedGLU8k,14943
examples/fairseq/models/machine_translation.py,sha256=xhWtfXter3UrBwDE2ukdajyTorbfrvZJgqGxltZ2GFE,22595
examples/fairseq/models/retnet.py,sha256=3gLpYYymv9xFb7dO8CeqnLP82M8QTUQst7lvojPVjoI,15919
examples/fairseq/tasks/__init__.py,sha256=qLgl40EN3YWrmyBEvQupSQk3qSaJrnBxsPBUBZ1x3go,1307
examples/fairseq/tasks/pretraining.py,sha256=Ojz3XS5AVA4LsDSuH7Bw_BS-e1HaThFgYsK-p2qtqVo,6882
examples/fairseq/tasks/data/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
examples/fairseq/tasks/data/basic_loader.py,sha256=x3R4Cf5BmxHLh_V6O-Kh6-x-TzaxxMRyEl4BT-N7mCk,1965
examples/fairseq/tasks/data/mlm_loader.py,sha256=3pbDKsXXrP7UKBUPeANXZFN5CO5oreDxe2VsLUCxWHw,11888
examples/fairseq/tasks/data/utils.py,sha256=9AvFLiUYoghQzMztuwItGx18YNNK852LguuOzzJovY4,2801
examples/fairseq/utils/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
examples/fairseq/utils/sparse_clip.py,sha256=xWD6XdOyLxWCW-DEy-MQiUCym5VzAQTdXYx6Bj0EO0o,3051
torchscale/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
torchscale/architecture/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
torchscale/architecture/config.py,sha256=sD93ObIqvq4OR5jfza3p_qEkBDRW3WWLCKJWa23eVMk,16050
torchscale/architecture/decoder.py,sha256=FNK3rDrB0TsIfflabipLxkrVTshjcDI-1bqmgtJ2bL0,15948
torchscale/architecture/encoder.py,sha256=MScVXpNOdP8_9dVHqBmDYFbaaZ9zZpLP6FX7hsH89Vs,13806
torchscale/architecture/encoder_decoder.py,sha256=JaNbxNmpZbpfzVvJMZWb38n0RWze5pc8T1AQzijWtOI,1679
torchscale/architecture/retnet.py,sha256=7WQ7bcXqJ_u1p-cTU0kjWSaqTcypGXjXJsckoyuyPyw,13525
torchscale/architecture/utils.py,sha256=KM-zUFiPkUutIms81i1BIXEUxr-1L6G7cp4avgNmpzQ,1260
torchscale/component/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
torchscale/component/dilated_attention.py,sha256=IxW-HFDb7i5hR0ls3dmko1UrvSBvs61k0xM3e7KL0yE,8000
torchscale/component/droppath.py,sha256=0d95ppYAh5tYQw4s08Xs_Dg1ikXAqF88FLpsctbyslk,558
torchscale/component/embedding.py,sha256=6ZfhhdPPiq_ay_XkVtxnh2VyY7euWtUAvoDBm9Ojsz4,3640
torchscale/component/feedforward_network.py,sha256=x01BMEa6AfQNtN_10cQ5Tx010hA22UJ4FZ-GuxMDnKc,4407
torchscale/component/flash_attention.py,sha256=pV7AeNAPuQgWb96TaOq4LsyzAY_5PFWASN3SGIux69k,4917
torchscale/component/gate_linear_unit.py,sha256=2M5O43q197fKptRKSxCL3oKnWDb8HSvo1d8hafQZo-4,1339
torchscale/component/multihead_attention.py,sha256=Z8AGUrHywEaMiir0DSOkl4gLzhbX6gJkJveMMSblF7I,6403
torchscale/component/multiscale_retention.py,sha256=v3dWg7QC9fgGY3_KOCP_qA_xdV-SRZZEEj2TtCmCvm0,7300
torchscale/component/multiway_network.py,sha256=B5OtpgICMmz_4FAhgONLn38AWTjZOT9pDU05zFva4Gs,1499
torchscale/component/relative_position_bias.py,sha256=snbqdKojZeCI7GcqQlj78iMi6196gQIrDLDzxgzLuj0,2752
torchscale/component/rms_norm.py,sha256=cpVsd5TA5jNsN1T3fKVlqK0_-LRpwsVO-Ag8-wtNWxY,773
torchscale/component/utils.py,sha256=Bm1eleBeSdg4d1bg8n3XHlxV-k6WM5aqRU0y7u78-K0,2170
torchscale/component/xpos_relative_position.py,sha256=0ze6MMW4NwGIOdbEQoMv4SzyN_nZt0ItU9t7IP0YuZE,2197
torchscale/component/xmoe/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
torchscale/component/xmoe/global_groups.py,sha256=IOQ8Inz8Ma5HEvyLV5kBIIgOug-K4xpqK_sJSwVz7vM,2335
torchscale/component/xmoe/moe_layer.py,sha256=NBefmZvRHJ9-RNqXJk5FQgG4lFq1kJTJ4TLOT_yL8FU,12079
torchscale/component/xmoe/routing.py,sha256=nw6Jj6Gdj4C-00dx0j91xTmA0eIQ2cBoR-3WyH78cIg,18530
torchscale/model/BEiT3.py,sha256=pMx7PbuaCJwTO4Z4ddRVyqjmm-eg631JecAP298QScA,3262
torchscale/model/LongNet.py,sha256=vuW2FNAC93Iv8N9DlicL2rct7nGPlXdyDvFLEP_F0aA,2042
torchscale/model/__init__.py,sha256=IbeM5C_urn7B9V2LJQSwn77mwv77tT3Xs-6OotRtbZk,90
torchscale_gml-0.2.0.dist-info/LICENSE,sha256=ws_MuBL-SCEBqPBFl9_FqZkaaydIJmxHrJG2parhU4M,1141
torchscale_gml-0.2.0.dist-info/METADATA,sha256=VdAQY2kCKMJtpGL-Yaapn2t-wIjsgEtTXLX4b6kyr0I,13292
torchscale_gml-0.2.0.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
torchscale_gml-0.2.0.dist-info/top_level.txt,sha256=bTlu3v6diEFqhT3FOfxxu4Ydsi4RPVx_q5ur2fQN4lU,20
torchscale_gml-0.2.0.dist-info/RECORD,,
