JSL_MedS_VLM_Reasoning_v1 (8B - q16)

Description

This is a vision-language model designed for medical document understanding and image-based clinical reasoning. It processes medical images and accompanying text to identify clinical findings, summarize content, and answer structured questions.

Download Copy S3 URI

How to use

from sparknlp.base import *
from sparknlp_jsl.annotator import *
from sparknlp_jsl.utils import *
from pyspark.ml import Pipeline

# Instruction text for the model; it is handed to vision_llm_preprocessor via `prompt=` below.
prompt = """
Act as a senior clinical specialist and analyze this medical document. Perform the following steps in order:
1. Clinical Summary: Identify the patient's primary and secondary diagnoses, including any 'overlap' syndromes mentioned.
2. Medication Analysis Table: Create a table listing:
    * Medication Name
    * Dosage & Frequency
    * Clinical Justification: Explain why this specific drug is being used for this patient’s symptoms (e.g., link the vasodilators to the finger ulcers).
3. Conditional Logic & Alerts: Explicitly list any instructions that are 'prn' (as needed) or conditional (e.g., 'in case of...'). Identify any medications that require close monitoring for this patient's condition.
4. Visual Verification: Confirm if there are any handwritten notes or signatures that modify the printed instructions.
Please reason step-by-step before providing your final answer.
"""

# Pipeline input built from the images path and the prompt; the stages below
# read its "prompt" and "image" columns.
input_df = vision_llm_preprocessor(
    spark=spark, images_path="images", prompt=prompt, output_col_name="prompt"
)

# "prompt" column -> "caption_document"
document_assembler = (
    DocumentAssembler()
    .setInputCol("prompt")
    .setOutputCol("caption_document")
)

# "image" column -> "image_assembler"
image_assembler = (
    ImageAssembler()
    .setInputCol("image")
    .setOutputCol("image_assembler")
)

# Pretrained vision LLM stage: consumes both assembler outputs and writes "completions".
medicalVisionLLM = (
    MedicalVisionLLM.pretrained("jsl_meds_vlm_reasoning_8b_q16_v1", "en", "clinical/models")
    .setInputCols(["caption_document", "image_assembler"])
    .setOutputCol("completions")
)

# Stage order matters: both assemblers must run before the model that reads their outputs.
pipeline = Pipeline().setStages([document_assembler, image_assembler, medicalVisionLLM])

# Fit and apply the pipeline on the same input DataFrame.
model = pipeline.fit(input_df)
result = model.transform(input_df)

from johnsnowlabs import nlp, medical
from sparknlp_jsl.utils import vision_llm_preprocessor

# Instruction text for the model; it is handed to vision_llm_preprocessor via `prompt=` below.
prompt = """
Act as a senior clinical specialist and analyze this medical document. Perform the following steps in order:
1. Clinical Summary: Identify the patient's primary and secondary diagnoses, including any 'overlap' syndromes mentioned.
2. Medication Analysis Table: Create a table listing:
    * Medication Name
    * Dosage & Frequency
    * Clinical Justification: Explain why this specific drug is being used for this patient’s symptoms (e.g., link the vasodilators to the finger ulcers).
3. Conditional Logic & Alerts: Explicitly list any instructions that are 'prn' (as needed) or conditional (e.g., 'in case of...'). Identify any medications that require close monitoring for this patient's condition.
4. Visual Verification: Confirm if there are any handwritten notes or signatures that modify the printed instructions.
Please reason step-by-step before providing your final answer.
"""

# Pipeline input built from the images path and the prompt; the stages below
# read its "prompt" and "image" columns.
input_df = vision_llm_preprocessor(
    spark=spark, images_path="images", prompt=prompt, output_col_name="prompt"
)

# "prompt" column -> "caption_document"
document_assembler = (
    nlp.DocumentAssembler()
    .setInputCol("prompt")
    .setOutputCol("caption_document")
)

# "image" column -> "image_assembler"
image_assembler = (
    nlp.ImageAssembler()
    .setInputCol("image")
    .setOutputCol("image_assembler")
)

# Pretrained vision LLM stage: consumes both assembler outputs and writes "completions".
medicalVisionLLM = (
    medical.MedicalVisionLLM.pretrained("jsl_meds_vlm_reasoning_8b_q16_v1", "en", "clinical/models")
    .setInputCols(["caption_document", "image_assembler"])
    .setOutputCol("completions")
)

# Stage order matters: both assemblers must run before the model that reads their outputs.
pipeline = nlp.Pipeline().setStages([document_assembler, image_assembler, medicalVisionLLM])

# Fit and apply the pipeline on the same input DataFrame.
model = pipeline.fit(input_df)
result = model.transform(input_df)

import com.johnsnowlabs.nlp.base._
import com.johnsnowlabs.nlp.annotators._
import com.johnsnowlabs.nlp.pretrained._
import org.apache.spark.ml.Pipeline

// Instruction text for the model; it is handed to VisionLLMPreprocessor via `prompt =` below.
val prompt = """
Act as a senior clinical specialist and analyze this medical document. Perform the following steps in order:
1. Clinical Summary: Identify the patient's primary and secondary diagnoses, including any 'overlap' syndromes mentioned.
2. Medication Analysis Table: Create a table listing:
    * Medication Name
    * Dosage & Frequency
    * Clinical Justification: Explain why this specific drug is being used for this patient’s symptoms (e.g., link the vasodilators to the finger ulcers).
3. Conditional Logic & Alerts: Explicitly list any instructions that are 'prn' (as needed) or conditional (e.g., 'in case of...'). Identify any medications that require close monitoring for this patient's condition.
4. Visual Verification: Confirm if there are any handwritten notes or signatures that modify the printed instructions.
Please reason step-by-step before providing your final answer.
"""

// Pipeline input built from the images path and the prompt; the stages below
// read its "prompt" and "image" columns.
val inputDf = VisionLLMPreprocessor(
  spark = spark, imagesPath = "images",
  prompt = prompt, outputColName = "prompt")

// "prompt" column -> "caption_document"
val documentAssembler =
  new DocumentAssembler().setInputCol("prompt").setOutputCol("caption_document")

// "image" column -> "image_assembler"
val imageAssembler =
  new ImageAssembler().setInputCol("image").setOutputCol("image_assembler")

// Pretrained vision LLM stage: consumes both assembler outputs and writes "completions".
val medicalVisionLLM =
  MedicalVisionLLM.pretrained("jsl_meds_vlm_reasoning_8b_q16_v1", "en", "clinical/models").
    setInputCols(Array("caption_document", "image_assembler")).
    setOutputCol("completions")

// Stage order matters: both assemblers must run before the model that reads their outputs.
val pipeline =
  new Pipeline().setStages(Array(documentAssembler, imageAssembler, medicalVisionLLM))

// Fit and apply the pipeline on the same input DataFrame.
val model = pipeline.fit(inputDf)
val result = model.transform(inputDf)

Results

{
  "patient": {
    "name": "Ms RUKHSANA SHAHEEN",
    "age": "56 yrs",
    "sex": "Female",
    "hospital_no": "MH005990453",
    "episode_no": "030000528270",
    "episode_date": "02/07/2021 08:31AM"
  },
  "diagnoses": ["systemic lupus erythematosus", "scleroderma overlap", "interstitial lung disease"],
  "symptoms": ["tightness of skin of the fists", "ulcers on the pulp of the fingers"],
  "treatment": [
    {"med": "Linezolid", "dose": "600 mg", "freq": "twice a day for 5 Days"},
    {"med": "Clopidogrel", "dose": "75 mg", "freq": "once a day after meals"},
    {"med": "Amlodipine", "dose": "5 mg", "freq": "once a day"},
    {"med": "Domperidone", "dose": "10 mg", "freq": "twice a day before meals"},
    {"med": "Omeprazole", "dose": "20 Mg", "freq": "Twice a Day before Meal"},
    {"med": "Bosentan", "dose": "62.5 mg", "freq": "twice a day after meals"},
    {"med": "Sildenafil Citrate", "dose": "0.5 mg", "freq": "twice a day after meals"},
    {"med": "Prednisolone", "dose": "5 mg", "freq": "once a day after breakfast"},
    {"med": "Mycophenolate mofetil", "dose": "500 mg 2 tablets", "freq": "twice a day"},
    {"med": "L-methylfolate calcium", "dose": "400 µg 1 tablet", "freq": "once a day"},
    {"med": "ciprofloxacin", "dose": "250 mg", "freq": "twice a day"}
  ]
}

Model Information

Model Name:	jsl_meds_vlm_reasoning_8b_q16_v1
Compatibility:	Healthcare NLP 6.3.0+
License:	Licensed
Edition:	Official
Input Labels:	[image, document]
Output Labels:	[completions]
Language:	en
Size:	13.5 GB

PREVIOUS: Sentence Entity Resolver for Logical Observation Identifiers Names and Codes (LOINC) codes

NEXT: JSL_MedS_VLM_Reasoning_v1 (8B - q4)