I am just following the steps in the documentation.
File ~/cluster-env/trident_env/lib/python3.11/site-packages/py4j/protocol.py:326, in get_return_value(answer, gateway_client, target_id, name) 324 value = OUTPUT_CONVERTER[type](answer[2:], gateway_client) 325 if answer[1] == REFERENCE_TYPE: --> 326 raise Py4JJavaError( 327 "An error occurred while calling {0}{1}{2}.\n". 328 format(target_id, ".", name), value) 329 else: 330 raise Py4JError( 331 "An error occurred while calling {0}{1}{2}. Trace:\n{3}\n". 332 format(target_id, ".", name, value)) Py4JJavaError: An error occurred while calling o7561.execute. : scala.NotImplementedError: an implementation is missing at scala.Predef$.$qmark$qmark$qmark(Predef.scala:288) at com.microsoft.fabric.spark.catalog.OnelakeExternalCatalog.functionExists(OnelakeExternalCatalog.scala:403) at com.microsoft.fabric.spark.catalog.InstrumentedExternalCatalog.$anonfun$functionExists$1(OnelakeExternalCatalog.scala:624) at scala.runtime.java8.JFunction0$mcZ$sp.apply(JFunction0$mcZ$sp.java:23) at com.microsoft.fabric.spark.catalog.metadata.Helpers$.timed(Helpers.scala:107) at com.microsoft.fabric.spark.catalog.InstrumentedExternalCatalog.functionExists(OnelakeExternalCatalog.scala:624) at org.apache.spark.sql.catalyst.catalog.ExternalCatalogWithListener.$anonfun$functionExists$1(ExternalCatalogWithListener.scala:341) at scala.runtime.java8.JFunction0$mcZ$sp.apply(JFunction0$mcZ$sp.java:23) at com.microsoft.fabric.spark.catalog.metrics.Helpers$.timed(CatalogMetricsHelper.scala:64) at org.apache.spark.sql.catalyst.catalog.ExternalCatalogWithListener.functionExists(ExternalCatalogWithListener.scala:341) at org.apache.spark.sql.catalyst.catalog.SessionCatalog.functionExists(SessionCatalog.scala:1580) at org.apache.spark.sql.internal.CatalogImpl.functionExists(CatalogImpl.scala:549) at zingg.spark.core.util.SparkFnRegistrar.registerUDF2(SparkFnRegistrar.java:21) at zingg.spark.core.preprocess.stopwords.SparkStopWordsRemover.registerUDF(SparkStopWordsRemover.java:60) at 
zingg.spark.core.preprocess.stopwords.SparkStopWordsRemover.init(SparkStopWordsRemover.java:65) at zingg.common.core.preprocess.IPreprocessors.executeAndBuildPreprocessedDF(IPreprocessors.java:53) at zingg.common.core.preprocess.IPreprocessors.preprocess(IPreprocessors.java:35) at zingg.common.core.executor.TrainingDataFinder.getPositiveSamples(TrainingDataFinder.java:198) at zingg.common.core.executor.TrainingDataFinder.execute(TrainingDataFinder.java:69) at zingg.common.client.Client.execute(Client.java:281) at java.base/jdk.internal.reflect.NativeMethodAccessorImpl.invoke0(Native Method) at java.base/jdk.internal.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62) at java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) at java.base/java.lang.reflect.Method.invoke(Method.java:566) at py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244) at py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:374) at py4j.Gateway.invoke(Gateway.java:282) at py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132) at py4j.commands.CallCommand.execute(CallCommand.java:79) at py4j.GatewayConnection.run(GatewayConnection.java:238) at java.base/java.lang.Thread.run(Thread.java:829)
Which Fabric environment are you on? Please use 1.3.
I am already using 1.3.
Are you on Zingg 0.5.0?
Name: zingg Version: 0.5.0 Summary: Zingg Entity Resolution, Data Mastering and Deduplication Home-page: https://github.com/zinggAI/zingg Author: Zingg.AI Author-email: sonalgoyal4@gmail.com License: https://github.com/zinggAI/zingg/blob/main/LICENSE Location: /home/trusted-service-user/cluster-env/trident_env/lib/python3.11/site-packages Requires: py4j Required-by: Note: you may need to restart the kernel to use updated packages.
Any updates?
Still the same error.
['--phase', 'findTrainingData'] arguments for client options are ['--phase', 'findTrainingData', '--license', 'zinggLic.txt', '--email', 'zingg@zingg.ai', '--conf', 'dummyConf.json'] <zingg.client.Arguments object at 0x7652eb0b3090> <zingg.client.ClientOptions object at 0x7652eb0bc1d0> <zingg.client.ZinggWithSpark object at 0x7652eafe4a90> --------------------------------------------------------------------------- Py4JJavaError Traceback (most recent call last) Cell In[148], line 8 6 print(options) 7 print(zingg) ----> 8 zingg.initAndExecute() File ~/cluster-env/trident_env/lib/python3.11/site-packages/zingg/client.py:280, in Zingg.initAndExecute(self) 278 self.client.execute() 279 else: --> 280 self.client.execute() File ~/cluster-env/trident_env/lib/python3.11/site-packages/py4j/java_gateway.py:1322, in __call__(self, *args) 1317 def __init__(self, target_id, gateway_client): 1318 """ 1319 :param target_id: the identifier of the object on the JVM side. Given 1320 by the JVM. 1321 -> 1322 :param gateway_client: the gateway client used to communicate with 1323 the JVM. 1324 """ 1325 self._target_id = target_id 1326 self._gateway_client = gateway_client File /opt/spark/python/lib/pyspark.zip/pyspark/errors/exceptions/captured.py:179, in capture_sql_exception.<locals>.deco(*a, **kw) 177 def deco(*a: Any, **kw: Any) -> Any: 178 try: --> 179 return f(*a, **kw) 180 except Py4JJavaError as e: 181 converted = convert_exception(e.java_exception) File ~/cluster-env/trident_env/lib/python3.11/site-packages/py4j/protocol.py:326, in get_return_value(answer, gateway_client, target_id, name) 324 value = OUTPUT_CONVERTER[type](answer[2:], gateway_client) 325 if answer[1] == REFERENCE_TYPE: --> 326 raise Py4JJavaError( 327 "An error occurred while calling {0}{1}{2}.\n". 328 format(target_id, ".", name), value) 329 else: 330 raise Py4JError( 331 "An error occurred while calling {0}{1}{2}. Trace:\n{3}\n". 
332 format(target_id, ".", name, value)) Py4JJavaError: An error occurred while calling o7654.execute. : scala.NotImplementedError: an implementation is missing at scala.Predef$.$qmark$qmark$qmark(Predef.scala:288) at com.microsoft.fabric.spark.catalog.OnelakeExternalCatalog.functionExists(OnelakeExternalCatalog.scala:403) at com.microsoft.fabric.spark.catalog.InstrumentedExternalCatalog.$anonfun$functionExists$1(OnelakeExternalCatalog.scala:624) at scala.runtime.java8.JFunction0$mcZ$sp.apply(JFunction0$mcZ$sp.java:23) at com.microsoft.fabric.spark.catalog.metadata.Helpers$.timed(Helpers.scala:107) at com.microsoft.fabric.spark.catalog.InstrumentedExternalCatalog.functionExists(OnelakeExternalCatalog.scala:624) at org.apache.spark.sql.catalyst.catalog.ExternalCatalogWithListener.$anonfun$functionExists$1(ExternalCatalogWithListener.scala:341) at scala.runtime.java8.JFunction0$mcZ$sp.apply(JFunction0$mcZ$sp.java:23) at com.microsoft.fabric.spark.catalog.metrics.Helpers$.timed(CatalogMetricsHelper.scala:64) at org.apache.spark.sql.catalyst.catalog.ExternalCatalogWithListener.functionExists(ExternalCatalogWithListener.scala:341) at org.apache.spark.sql.catalyst.catalog.SessionCatalog.functionExists(SessionCatalog.scala:1580) at org.apache.spark.sql.internal.CatalogImpl.functionExists(CatalogImpl.scala:549) at zingg.spark.core.util.SparkFnRegistrar.registerUDF2(SparkFnRegistrar.java:21) at zingg.spark.core.preprocess.stopwords.SparkStopWordsRemover.registerUDF(SparkStopWordsRemover.java:60) at zingg.spark.core.preprocess.stopwords.SparkStopWordsRemover.init(SparkStopWordsRemover.java:65) at zingg.common.core.preprocess.IPreprocessors.executeAndBuildPreprocessedDF(IPreprocessors.java:53) at zingg.common.core.preprocess.IPreprocessors.preprocess(IPreprocessors.java:35) at zingg.common.core.executor.TrainingDataFinder.getPositiveSamples(TrainingDataFinder.java:198) at zingg.common.core.executor.TrainingDataFinder.execute(TrainingDataFinder.java:69) at 
zingg.common.client.Client.execute(Client.java:281) at java.base/jdk.internal.reflect.NativeMethodAccessorImpl.invoke0(Native Method) at java.base/jdk.internal.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62) at java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) at java.base/java.lang.reflect.Method.invoke(Method.java:566) at py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244) at py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:374) at py4j.Gateway.invoke(Gateway.java:282) at py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132) at py4j.commands.CallCommand.execute(CallCommand.java:79) at py4j.GatewayConnection.run(GatewayConnection.java:238) at java.base/java.lang.Thread.run(Thread.java:829)