@@ -44,7 +44,7 @@ class CPMTransformer(AnnotatorModel, HasBatchedAnnotate, HasEngine):
4444 ... .setOutputCol("generation")
4545
4646
47- The default model is ``"llam2-7b "``, if no name is provided. For available
47+ The default model is ``"mini_cpm_2b_8bit"``, if no name is provided. For available
4848 pretrained models please see the `Models Hub
4949 <https://sparknlp.org/models?q=cpm>`__.
5050
@@ -104,7 +104,7 @@ class CPMTransformer(AnnotatorModel, HasBatchedAnnotate, HasEngine):
104104 >>> documentAssembler = DocumentAssembler() \\
105105 ... .setInputCol("text") \\
106106 ... .setOutputCol("documents")
107- >>> cpm = CPMTransformer.pretrained("llama_2_7b_chat_hf_int4 ") \\
107+ >>> cpm = CPMTransformer.pretrained("mini_cpm_2b_8bit", "xx") \\
108108 ... .setInputCols(["documents"]) \\
109109 ... .setMaxOutputLength(50) \\
110110 ... .setOutputCol("generation")
@@ -299,15 +299,15 @@ def loadSavedModel(folder, spark_session, use_openvino = False):
299299 return CPMTransformer (java_model = jModel )
300300
301301 @staticmethod
302- def pretrained (name = "llama_2_7b_chat_hf_int4 " , lang = "en " , remote_loc = None ):
302+ def pretrained (name = "mini_cpm_2b_8bit " , lang = "xx " , remote_loc = None ):
303303 """Downloads and loads a pretrained model.
304304
305305 Parameters
306306 ----------
307307 name : str, optional
308- Name of the pretrained model, by default "llama_2_7b_chat_hf_int4 "
308+ Name of the pretrained model, by default "mini_cpm_2b_8bit"
309309 lang : str, optional
310- Language of the pretrained model, by default "en "
310+ Language of the pretrained model, by default "xx"
311311 remote_loc : str, optional
312312 Optional remote address of the resource, by default None. Will use
313313 Spark NLPs repositories otherwise.
0 commit comments