Packages

t

com.johnsnowlabs.ml.gguf

LLMLoaderInferenceParams

trait LLMLoaderInferenceParams[T] extends AnyRef

Linear Supertypes
AnyRef, Any
Known Subclasses
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. LLMLoaderInferenceParams
  2. AnyRef
  3. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  4. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  5. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  6. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  7. def equals(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  8. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  9. final def getClass(): Class[_]
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  10. def getSystemPrompt: String
  11. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  12. val inferenceParameters: InferenceParameters
    Attributes
    protected
  13. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  14. def loadParamsMap(paramsMap: Map[String, Any]): Unit
    Attributes
    protected
  15. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  16. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  17. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  18. val paramsMap: Map[String, Any]
    Attributes
    protected
  19. def setCachePrompt(cachePrompt: Boolean): T

    Whether to remember the prompt to avoid reprocessing it

  20. def setDynamicTemperatureExponent(dynatempExponent: Float): T

    Set the dynamic temperature exponent (default: 1.0)

  21. def setDynamicTemperatureRange(dynatempRange: Float): T

    Set the dynamic temperature range (default: 0.0, 0.0 = disabled)

  22. def setFrequencyPenalty(frequencyPenalty: Float): T

    Set the repetition alpha frequency penalty (default: 0.0, 0.0 = disabled)

  23. def setGrammar(grammar: String): T

    Set BNF-like grammar to constrain generations (see samples in grammars/ dir)

  24. def setIgnoreEos(ignoreEos: Boolean): T

    Set whether to ignore the end-of-stream token and continue generating (implies --logit-bias 2-inf)

  25. def setInputPrefix(inputPrefix: String): T

    Set a prefix for infilling (default: empty)

  26. def setInputSuffix(inputSuffix: String): T

    Set a suffix for infilling (default: empty)

  27. def setMinKeep(minKeep: Int): T

    Set the minimum number of tokens the samplers should return (0 = disabled)

  28. def setMinP(minP: Float): T

    Set min-p sampling (default: 0.1, 0.0 = disabled)

  29. def setMiroStatEta(mirostatEta: Float): T

    Set the MiroStat learning rate, parameter eta (default: 0.1)

  30. def setMiroStatTau(mirostatTau: Float): T

    Set the MiroStat target entropy, parameter tau (default: 5.0)

  31. def setNKeep(nKeep: Int): T

    Set the number of tokens to keep from the initial prompt (default: 0, -1 = all)

  32. def setNPredict(nPredict: Int): T

    Set the number of tokens to predict (default: -1, -1 = infinity, -2 = until context filled)

  33. def setNProbs(nProbs: Int): T

    Set the number of top token probabilities to output, if greater than 0.

  34. def setPenalizeNl(penalizeNl: Boolean): T

    Whether to penalize newline tokens

  35. def setPenaltyPrompt(tokens: ArrayList[Int]): T
  36. def setPenaltyPrompt(tokens: Array[Int]): T

    Override which tokens to penalize for repetition.

    Override which tokens to penalize for repetition. E.g. if original prompt is "Alice: Hello!" and penaltyPrompt corresponds to the token ids of "Hello!", only the latter will be penalized if repeated. See pull request 3727 for more details.

  37. def setPenaltyPrompt(penaltyPrompt: String): T

    Override which part of the prompt is penalized for repetition.

    Override which part of the prompt is penalized for repetition. E.g. if original prompt is "Alice: Hello!" and penaltyPrompt is "Hello!", only the latter will be penalized if repeated. See pull request 3727 for more details.

  38. def setPresencePenalty(presencePenalty: Float): T

    Set the repetition alpha presence penalty (default: 0.0, 0.0 = disabled)

  39. def setRepeatLastN(repeatLastN: Int): T

    Set the last n tokens to consider for penalties (default: 64, 0 = disabled, -1 = ctx_size)

  40. def setRepeatPenalty(repeatPenalty: Float): T

    Set the penalty of repeated sequences of tokens (default: 1.0, 1.0 = disabled)

  41. def setSeed(seed: Int): T

    Set the RNG seed (default: -1, use random seed for < 0)

  42. def setStopStrings(stopStrings: ArrayList[String]): T
  43. def setStopStrings(stopStrings: Array[String]): T

    Set the strings that stop token generation when encountered

  44. def setSystemPrompt(systemPrompt: String): T
  45. def setTemperature(temperature: Float): T

    Set the temperature (default: 0.8)

  46. def setTfsZ(tfsZ: Float): T

    Set tail free sampling, parameter z (default: 1.0, 1.0 = disabled)

  47. def setTopK(topK: Int): T

    Set top-k sampling (default: 40, 0 = disabled)

  48. def setTopP(topP: Float): T

    Set top-p sampling (default: 0.9, 1.0 = disabled)

  49. def setTypicalP(typicalP: Float): T

    Set locally typical sampling, parameter p (default: 1.0, 1.0 = disabled)

  50. def setUseChatTemplate(useChatTemplate: Boolean): T

    Set whether generation should apply a chat template (default: false)

  51. final def synchronized[T0](arg0: ⇒ T0): T0
    Definition Classes
    AnyRef
  52. def toString(): String
    Definition Classes
    AnyRef → Any
  53. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  54. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  55. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()

Inherited from AnyRef

Inherited from Any

Ungrouped