diff --git a/README.md b/README.md index a6bdc61..c43f9d1 100644 --- a/README.md +++ b/README.md @@ -137,7 +137,7 @@ image_encoder = Extractor( text_encoder = TextTransformer( dim = 512, num_tokens = 10000, - max_seq_len = 256 + 1, + max_seq_len = 256, depth = 6, heads = 8 ) diff --git a/setup.py b/setup.py index b2b95d6..964939b 100644 --- a/setup.py +++ b/setup.py @@ -3,7 +3,7 @@ setup( name = 'x-clip', packages = find_packages(exclude=[]), - version = '0.0.11', + version = '0.0.12', license='MIT', description = 'X-CLIP', author = 'Phil Wang', diff --git a/x_clip/x_clip.py b/x_clip/x_clip.py index 5fe39e1..7c62e34 100644 --- a/x_clip/x_clip.py +++ b/x_clip/x_clip.py @@ -247,7 +247,7 @@ def __init__( self.text_transformer = TextTransformer( dim = dim_text, num_tokens = num_text_tokens + (1 if use_mlm else 0), - max_seq_len = text_seq_len + 1, + max_seq_len = text_seq_len, depth = text_enc_depth, heads = text_heads )