uncharted-distil / distil-auto-ml

Distil Automated Machine Learning Server
Apache License 2.0
2 stars · 1 fork · source link

Failure on H1BVisa set #197

Status: Closed (cdbethune closed this issue 4 years ago)

cdbethune commented 4 years ago
WARNING:d3m.utils:Using global/shared random source using 'random.randint' can make execution not reproducible.
Stack (most recent call last):
  File "/usr/lib/python3.6/runpy.py", line 193, in _run_module_as_main
    "__main__", mod_spec)
  File "/usr/lib/python3.6/runpy.py", line 85, in _run_code
    exec(code, run_globals)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 2911, in <module>
    main(sys.argv)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 2907, in main
    cli.runtime_handler(arguments, parser)
  File "/home/chris/dev/git_work/d3m/d3m/cli.py", line 539, in runtime_handler
    problem_resolver=problem_resolver,
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 2534, in fit_score_handler
    runtime_environment=runtime_environment,
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1323, in fit
    result = runtime.fit(inputs, return_values=return_values)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1132, in fit
    return self._run(inputs, metadata_base.PipelineRunPhase.FIT, return_values)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1039, in _run
    self._do_run()
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1025, in _do_run
    self._do_run_step(step)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1008, in _do_run_step
    self._run_step(step)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 998, in _run_step
    self._run_primitive(step)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 873, in _run_primitive
    multi_call_result = self._call_primitive_method(primitive.fit_multi_produce, fit_multi_produce_arguments)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 970, in _call_primitive_method
    result = method(**arguments)
  File "/home/chris/dev/git_work/d3m/d3m/primitive_interfaces/base.py", line 532, in fit_multi_produce
    return self._fit_multi_produce(produce_methods=produce_methods, timeout=timeout, iterations=iterations, inputs=inputs, outputs=outputs)
  File "/home/chris/dev/git_work/d3m/d3m/primitive_interfaces/base.py", line 559, in _fit_multi_produce
    fit_result = self.fit(timeout=timeout, iterations=iterations)
  File "/home/chris/dev/git_work/distil-primitives/distil/primitives/text_encoder.py", line 135, in fit
    self._outputs)  # requires fit transform to fit SVM on vectorizer results
  File "/home/chris/dev/git_work/distil-primitives/distil/preprocessing/transformers.py", line 107, in fit_transform
    out = cross_val_predict(self._model, Xv, y, method='decision_function', n_jobs=self.NUM_JOBS, cv=num_folds)
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/sklearn/model_selection/_validation.py", line 755, in cross_val_predict
    for train, test in cv.split(X, y, groups))
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/joblib/parallel.py", line 874, in __call__
    n_jobs = self._initialize_backend()
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/joblib/parallel.py", line 673, in _initialize_backend
    **self._backend_args)
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/joblib/_parallel_backends.py", line 476, in configure
    **memmappingexecutor_args)
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/joblib/executor.py", line 29, in get_memmapping_executor
    id_executor = random.randint(0, int(1e10))
  File "/home/chris/dev/git_work/d3m/d3m/utils.py", line 1137, in wrapper
    stack_info=True,
  File "/home/chris/dev/git_work/d3m/d3m/utils.py", line 1593, in log_once
    logger.log(level, msg, *args, **kwargs)
Traceback (most recent call last):
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1008, in _do_run_step
    self._run_step(step)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 998, in _run_step
    self._run_primitive(step)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 873, in _run_primitive
    multi_call_result = self._call_primitive_method(primitive.fit_multi_produce, fit_multi_produce_arguments)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 974, in _call_primitive_method
    raise error
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 970, in _call_primitive_method
    result = method(**arguments)
  File "/home/chris/dev/git_work/d3m/d3m/primitive_interfaces/base.py", line 532, in fit_multi_produce
    return self._fit_multi_produce(produce_methods=produce_methods, timeout=timeout, iterations=iterations, inputs=inputs, outputs=outputs)
  File "/home/chris/dev/git_work/d3m/d3m/primitive_interfaces/base.py", line 559, in _fit_multi_produce
    fit_result = self.fit(timeout=timeout, iterations=iterations)
  File "/home/chris/dev/git_work/distil-primitives/distil/primitives/text_encoder.py", line 135, in fit
    self._outputs)  # requires fit transform to fit SVM on vectorizer results
  File "/home/chris/dev/git_work/distil-primitives/distil/preprocessing/transformers.py", line 97, in fit_transform
    Xv  = self._vect.fit_transform(X)
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/sklearn/feature_extraction/text.py", line 1859, in fit_transform
    X = super().fit_transform(raw_documents)
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/sklearn/feature_extraction/text.py", line 1220, in fit_transform
    self.fixed_vocabulary_)
  File "/home/chris/dev/environments/distil-auto-ml/lib/python3.6/site-packages/sklearn/feature_extraction/text.py", line 1150, in _count_vocab
    raise ValueError("empty vocabulary; perhaps the documents only"
ValueError: empty vocabulary; perhaps the documents only contain stop words

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/usr/lib/python3.6/runpy.py", line 193, in _run_module_as_main
    "__main__", mod_spec)
  File "/usr/lib/python3.6/runpy.py", line 85, in _run_code
    exec(code, run_globals)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 2911, in <module>
    main(sys.argv)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 2907, in main
    cli.runtime_handler(arguments, parser)
  File "/home/chris/dev/git_work/d3m/d3m/cli.py", line 539, in runtime_handler
    problem_resolver=problem_resolver,
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 2540, in fit_score_handler
    fit_result.check_success()
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 67, in check_success
    raise self.error
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1039, in _run
    self._do_run()
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1025, in _do_run
    self._do_run_step(step)
  File "/home/chris/dev/git_work/d3m/d3m/runtime.py", line 1017, in _do_run_step
    ) from error
d3m.exceptions.StepFailedError: Step 9 for pipeline f3c58095-e865-4460-bd94-202efde25f30 failed.