Skip to content

WIP [DeepSeek R1] Add DeepSeekV3 Base + Weight Conversion #2171

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account-related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 10 commits into
base: master
Choose a base branch
from
16 changes: 8 additions & 8 deletions keras_hub/api/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,12 +4,12 @@
since your modifications would be overwritten.
"""

from keras_hub.api import layers
from keras_hub.api import metrics
from keras_hub.api import models
from keras_hub.api import samplers
from keras_hub.api import tokenizers
from keras_hub.api import utils
from keras_hub.src.utils.preset_utils import upload_preset
from keras_hub.api import layers as layers
from keras_hub.api import metrics as metrics
from keras_hub.api import models as models
from keras_hub.api import samplers as samplers
from keras_hub.api import tokenizers as tokenizers
from keras_hub.api import utils as utils
from keras_hub.src.utils.preset_utils import upload_preset as upload_preset
from keras_hub.src.version_utils import __version__
from keras_hub.src.version_utils import version
from keras_hub.src.version_utils import version as version
120 changes: 81 additions & 39 deletions keras_hub/api/layers/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,74 +4,116 @@
since your modifications would be overwritten.
"""

from keras_hub.src.layers.modeling.alibi_bias import AlibiBias
from keras_hub.src.layers.modeling.anchor_generator import AnchorGenerator
from keras_hub.src.layers.modeling.box_matcher import BoxMatcher
from keras_hub.src.layers.modeling.alibi_bias import AlibiBias as AlibiBias
from keras_hub.src.layers.modeling.anchor_generator import (
AnchorGenerator as AnchorGenerator,
)
from keras_hub.src.layers.modeling.box_matcher import BoxMatcher as BoxMatcher
from keras_hub.src.layers.modeling.cached_multi_head_attention import (
CachedMultiHeadAttention,
CachedMultiHeadAttention as CachedMultiHeadAttention,
)
from keras_hub.src.layers.modeling.f_net_encoder import (
FNetEncoder as FNetEncoder,
)
from keras_hub.src.layers.modeling.masked_lm_head import (
MaskedLMHead as MaskedLMHead,
)
from keras_hub.src.layers.modeling.non_max_supression import (
NonMaxSuppression as NonMaxSuppression,
)
from keras_hub.src.layers.modeling.position_embedding import (
PositionEmbedding as PositionEmbedding,
)
from keras_hub.src.layers.modeling.f_net_encoder import FNetEncoder
from keras_hub.src.layers.modeling.masked_lm_head import MaskedLMHead
from keras_hub.src.layers.modeling.non_max_supression import NonMaxSuppression
from keras_hub.src.layers.modeling.position_embedding import PositionEmbedding
from keras_hub.src.layers.modeling.reversible_embedding import (
ReversibleEmbedding,
ReversibleEmbedding as ReversibleEmbedding,
)
from keras_hub.src.layers.modeling.rms_normalization import (
RMSNormalization as RMSNormalization,
)
from keras_hub.src.layers.modeling.rotary_embedding import (
RotaryEmbedding as RotaryEmbedding,
)
from keras_hub.src.layers.modeling.rms_normalization import RMSNormalization
from keras_hub.src.layers.modeling.rotary_embedding import RotaryEmbedding
from keras_hub.src.layers.modeling.sine_position_encoding import (
SinePositionEncoding,
SinePositionEncoding as SinePositionEncoding,
)
from keras_hub.src.layers.modeling.token_and_position_embedding import (
TokenAndPositionEmbedding,
TokenAndPositionEmbedding as TokenAndPositionEmbedding,
)
from keras_hub.src.layers.modeling.transformer_decoder import (
TransformerDecoder as TransformerDecoder,
)
from keras_hub.src.layers.modeling.transformer_encoder import (
TransformerEncoder as TransformerEncoder,
)
from keras_hub.src.layers.preprocessing.audio_converter import (
AudioConverter as AudioConverter,
)
from keras_hub.src.layers.preprocessing.image_converter import (
ImageConverter as ImageConverter,
)
from keras_hub.src.layers.modeling.transformer_decoder import TransformerDecoder
from keras_hub.src.layers.modeling.transformer_encoder import TransformerEncoder
from keras_hub.src.layers.preprocessing.audio_converter import AudioConverter
from keras_hub.src.layers.preprocessing.image_converter import ImageConverter
from keras_hub.src.layers.preprocessing.masked_lm_mask_generator import (
MaskedLMMaskGenerator,
MaskedLMMaskGenerator as MaskedLMMaskGenerator,
)
from keras_hub.src.layers.preprocessing.multi_segment_packer import (
MultiSegmentPacker,
MultiSegmentPacker as MultiSegmentPacker,
)
from keras_hub.src.layers.preprocessing.random_deletion import (
RandomDeletion as RandomDeletion,
)
from keras_hub.src.layers.preprocessing.random_swap import (
RandomSwap as RandomSwap,
)
from keras_hub.src.layers.preprocessing.start_end_packer import (
StartEndPacker as StartEndPacker,
)
from keras_hub.src.layers.preprocessing.random_deletion import RandomDeletion
from keras_hub.src.layers.preprocessing.random_swap import RandomSwap
from keras_hub.src.layers.preprocessing.start_end_packer import StartEndPacker
from keras_hub.src.models.basnet.basnet_image_converter import (
BASNetImageConverter,
BASNetImageConverter as BASNetImageConverter,
)
from keras_hub.src.models.clip.clip_image_converter import (
CLIPImageConverter as CLIPImageConverter,
)
from keras_hub.src.models.clip.clip_image_converter import CLIPImageConverter
from keras_hub.src.models.deeplab_v3.deeplab_v3_image_converter import (
DeepLabV3ImageConverter,
DeepLabV3ImageConverter as DeepLabV3ImageConverter,
)
from keras_hub.src.models.densenet.densenet_image_converter import (
DenseNetImageConverter,
DenseNetImageConverter as DenseNetImageConverter,
)
from keras_hub.src.models.efficientnet.efficientnet_image_converter import (
EfficientNetImageConverter,
EfficientNetImageConverter as EfficientNetImageConverter,
)
from keras_hub.src.models.mit.mit_image_converter import (
MiTImageConverter as MiTImageConverter,
)
from keras_hub.src.models.mit.mit_image_converter import MiTImageConverter
from keras_hub.src.models.mobilenet.mobilenet_image_converter import (
MobileNetImageConverter,
MobileNetImageConverter as MobileNetImageConverter,
)
from keras_hub.src.models.pali_gemma.pali_gemma_image_converter import (
PaliGemmaImageConverter,
PaliGemmaImageConverter as PaliGemmaImageConverter,
)
from keras_hub.src.models.resnet.resnet_image_converter import (
ResNetImageConverter,
ResNetImageConverter as ResNetImageConverter,
)
from keras_hub.src.models.retinanet.retinanet_image_converter import (
RetinaNetImageConverter,
RetinaNetImageConverter as RetinaNetImageConverter,
)
from keras_hub.src.models.sam.sam_image_converter import (
SAMImageConverter as SAMImageConverter,
)
from keras_hub.src.models.sam.sam_mask_decoder import (
SAMMaskDecoder as SAMMaskDecoder,
)
from keras_hub.src.models.sam.sam_prompt_encoder import (
SAMPromptEncoder as SAMPromptEncoder,
)
from keras_hub.src.models.sam.sam_image_converter import SAMImageConverter
from keras_hub.src.models.sam.sam_mask_decoder import SAMMaskDecoder
from keras_hub.src.models.sam.sam_prompt_encoder import SAMPromptEncoder
from keras_hub.src.models.segformer.segformer_image_converter import (
SegFormerImageConverter,
SegFormerImageConverter as SegFormerImageConverter,
)
from keras_hub.src.models.vgg.vgg_image_converter import (
VGGImageConverter as VGGImageConverter,
)
from keras_hub.src.models.vit.vit_image_converter import (
ViTImageConverter as ViTImageConverter,
)
from keras_hub.src.models.vgg.vgg_image_converter import VGGImageConverter
from keras_hub.src.models.vit.vit_image_converter import ViTImageConverter
from keras_hub.src.models.whisper.whisper_audio_converter import (
WhisperAudioConverter,
WhisperAudioConverter as WhisperAudioConverter,
)
10 changes: 5 additions & 5 deletions keras_hub/api/metrics/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,8 @@
since your modifications would be overwritten.
"""

from keras_hub.src.metrics.bleu import Bleu
from keras_hub.src.metrics.edit_distance import EditDistance
from keras_hub.src.metrics.perplexity import Perplexity
from keras_hub.src.metrics.rouge_l import RougeL
from keras_hub.src.metrics.rouge_n import RougeN
from keras_hub.src.metrics.bleu import Bleu as Bleu
from keras_hub.src.metrics.edit_distance import EditDistance as EditDistance
from keras_hub.src.metrics.perplexity import Perplexity as Perplexity
from keras_hub.src.metrics.rouge_l import RougeL as RougeL
from keras_hub.src.metrics.rouge_n import RougeN as RougeN
Loading