diff --git a/prompting/Prompting.ipynb b/prompting/Prompting.ipynb new file mode 100644 index 0000000..e5d407e --- /dev/null +++ b/prompting/Prompting.ipynb @@ -0,0 +1,793 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "hQQtgsnP-G9J" + }, + "source": [ + "

SRBED-10 [Prompt Engineering for Translation]

\n", + "\n", + "Task: create a prompt adapted to scientific domain (for scifact dataset), compare it with the default translation, see how it affects the translation quality\n", + "\n", + "All the results can be found in Data Translation Benchmark (google docs).\n" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "collapsed": true, + "id": "uN6T2p94I3b2", + "jupyter": { + "outputs_hidden": true + }, + "outputId": "1f069269-f1c4-46a9-83e8-51b3bc7e2b60" + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Collecting openai\n", + " Downloading openai-1.30.1-py3-none-any.whl.metadata (21 kB)\n", + "Requirement already satisfied: anyio<5,>=3.5.0 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from openai) (4.3.0)\n", + "Collecting distro<2,>=1.7.0 (from openai)\n", + " Downloading distro-1.9.0-py3-none-any.whl.metadata (6.8 kB)\n", + "Requirement already satisfied: httpx<1,>=0.23.0 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from openai) (0.27.0)\n", + "Requirement already satisfied: pydantic<3,>=1.9.0 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from openai) (2.6.4)\n", + "Requirement already satisfied: sniffio in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from openai) (1.3.1)\n", + "Collecting tqdm>4 (from openai)\n", + " Downloading tqdm-4.66.4-py3-none-any.whl.metadata (57 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.6/57.6 kB\u001b[0m \u001b[31m3.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hRequirement already satisfied: typing-extensions<5,>=4.7 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from openai) (4.10.0)\n", + "Requirement already satisfied: idna>=2.8 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from anyio<5,>=3.5.0->openai) (3.6)\n", + "Requirement already satisfied: certifi in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from httpx<1,>=0.23.0->openai) (2024.2.2)\n", + "Requirement already satisfied: httpcore==1.* in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from httpx<1,>=0.23.0->openai) (1.0.5)\n", + "Requirement already satisfied: h11<0.15,>=0.13 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from httpcore==1.*->httpx<1,>=0.23.0->openai) (0.14.0)\n", + "Requirement already satisfied: annotated-types>=0.4.0 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from pydantic<3,>=1.9.0->openai) (0.6.0)\n", + "Requirement already satisfied: pydantic-core==2.16.3 in /Users/nevenarokvic/myenv/lib/python3.12/site-packages (from pydantic<3,>=1.9.0->openai) (2.16.3)\n", + "Downloading openai-1.30.1-py3-none-any.whl (320 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m320.6/320.6 kB\u001b[0m \u001b[31m9.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading distro-1.9.0-py3-none-any.whl (20 kB)\n", + "Downloading tqdm-4.66.4-py3-none-any.whl (78 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m78.3/78.3 kB\u001b[0m \u001b[31m7.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hInstalling collected packages: tqdm, distro, openai\n", + "Successfully installed distro-1.9.0 openai-1.30.1 tqdm-4.66.4\n", + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], + "source": [ + "!pip install openai" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": true, + "id": "PxV9GSTNJBFV", + "jupyter": { + "outputs_hidden": true + } + }, + "outputs": [ + { + "ename": "ModuleNotFoundError", + "evalue": "No module named 'google'", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[0;32mIn[2], line 2\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mopenai\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m OpenAI\n\u001b[0;32m----> 2\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mgoogle\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mcolab\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m userdata\n\u001b[1;32m 4\u001b[0m OPENAI_KEY \u001b[38;5;241m=\u001b[39m userdata\u001b[38;5;241m.\u001b[39mget(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mOPENAI_API_KEY\u001b[39m\u001b[38;5;124m'\u001b[39m)\n\u001b[1;32m 5\u001b[0m client \u001b[38;5;241m=\u001b[39m OpenAI(api_key\u001b[38;5;241m=\u001b[39mOPENAI_KEY)\n", + "\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'google'" + ] + } + ], + "source": [ + "from openai import OpenAI\n", + "from google.colab import userdata\n", + "\n", + "OPENAI_KEY = userdata.get('OPENAI_API_KEY')\n", + "client = OpenAI(api_key=OPENAI_KEY)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "vX9NA-PwMqa2" + }, + "outputs": [], + "source": [ + "def translate(query: str, model: str = 'gpt-4o') -> str:\n", + " \"\"\" Translate to Serbian via OPENAI API. \"\"\"\n", + "\n", + " response = client.chat.completions.create(\n", + " model=model,\n", + " messages=[\n", + " {\n", + " \"role\": \"system\",\n", + " \"content\": SYSTEM_PROMPT\n", + " },\n", + " {\n", + " \"role\": \"user\",\n", + " \"content\": query\n", + " }\n", + " ],\n", + " temperature=0.7,\n", + " top_p=1\n", + " )\n", + "\n", + " return response" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "sDKaMo-eqa6g" + }, + "source": [ + "### System prompt adapted to science domain\n", + "This prompt provides comprehensive instructions for translating scientific passages from English to Serbian (Latin script), emphasizing accuracy and consistency. The guidelines focus on precise translation of scientific terminology, correct handling of numeric data, preservation of context, consistency in terminology and formatting, and grammatical correctness. Additionally, it includes specific instructions with human-labeled examples highlighting common errors from default translations, such as ensuring that translated terms and their acronyms match the Serbian equivalents.\n", + "\n", + "\n", + "GPT-4o vs GPT-3.5 (for more details refer to Data Translation Benchmark):\n", + "\n", + "- Better translates abbreviations and correctly adds grammatical suffixes\n", + "- Translates some terms more naturally, capturing the essence of the language.\n", + "- Successfully translates abbreviations into Serbian when the original term exists (for example, it translates 'blood pressure - BP' as 'krvni pritisak - KP')\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "AHYkuKr4Maol" + }, + "outputs": [], + "source": [ + "SYSTEM_PROMPT = \"\"\"\n", + "I would like you to help me translate the provided passages from English into Serbian (Latin script).\n", + "\n", + "Since this is a scientific dataset, it is crucial to maintain accuracy and consistency in the translation. Please adhere to the following guidelines:\n", + "\n", + "1. **Accuracy of Terminology:**\n", + " - Ensure that all scientific terms and terminology are translated accurately and consistently.\n", + " - Use appropriate Serbian scientific terminology where applicable.\n", + " - Avoid using English terms when there is an appropriate Serbian term available\n", + "\n", + "2. **Numeric Data Integrity:**\n", + " - Keep all numeric data unchanged, including decimal points and numeric values.\n", + " - Verify that units of measurement are translated correctly and consistently according to Serbian language conventions.\n", + "\n", + "3. **Context Preservation:**\n", + " - Preserve the scientific context of the dataset to avoid misinterpretation.\n", + " - Ensure that the translation maintains the original meaning and context.\n", + "\n", + "4. **Consistency:**\n", + " - Maintain consistency in terminology, units, and formatting throughout the entire text.\n", + "\n", + "5. **Grammatical Accuracy:**\n", + " - Follow the grammatical rules of the Serbian language and make sure to use the correct declension when translating nouns, adjectives and pronouns.\n", + " - Ensure that the translation is grammatically correct and natural-sounding in Serbian\n", + " - If there is a term and its acronym present, they should be also translated to serbian. You can follow the guideline bellow:\n", + "\n", + " EXAMPLE (acronym):\n", + "\n", + " ENGLISH:\n", + " \"Epidemiologic analysis of family data on blood pressure (BP) is often compromised by the effects of antihypertensive medications.\"\n", + "\n", + " SERBIAN:\n", + " \"Epidemiološka analiza porodičnih podataka o krvnom pritisku (KP) često je ugrožena efektima antihipertenzivnih lekova.\"\n", + "\n", + " REASONING:\n", + " * The translation is correct because the term \"blood pressure\" is translated as \"krvni pritisak\" and the acronym BP is translated to KP, matching the Serbian term.\n", + "\n", + "\n", + "Translate the following dataset while adhering to these guidelines.\n", + "The output should be the translated passage from English to Serbian (Latin script).\n", + "\n", + "\"\"\"\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "bquRCdrIOLJw", + "outputId": "9ef60bb4-fc57-49fc-a1bf-85031874ae7c" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Identifikacija genomičkih elemenata potrebnih za vitalnost je centralna za naše razumevanje osnovne fiziologije bakterijskih patogena. Nedavno, kombinacija visokog intenziteta mutageneze i dubinskog sekvenciranja omogućila je identifikaciju gena koji su potrebni i uslovno potrebni u mnogim bakterijama. Geni, međutim, čine samo deo složenih genoma važnih bakterijskih patogena. Ovde koristimo nepristrasnu analizu kako bismo sveobuhvatno identifikovali genomski regione, uključujući gene, domene i intergeničke elemente, potrebne za optimalan rast Mycobacterium tuberculosis, važnog globalnog zdravstvenog patogena. Utvrdili smo da nekoliko proteina zajedno sadrži i domene potrebne za optimalan rast i domene koje su nepotrebne. Pored toga, mnoge nekodirajuće regione, uključujući regulatorne elemente i nekodirajuće RNK, su ključne za rast mikobakterija. Naša analiza pokazuje da su genetski zahtevi za rast složeniji nego što se može razumeti korišćenjem analize usmerene na gene.'" + ] + }, + "execution_count": 68, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Identifying genomic elements required for viability is central to our understanding of the basic physiology of bacterial pathogens. Recently, the combination of high-density mutagenesis and deep sequencing has allowed for the identification of required and conditionally required genes in many bacteria. Genes, however, make up only a part of the complex genomes of important bacterial pathogens. Here, we use an unbiased analysis to comprehensively identify genomic regions, including genes, domains, and intergenic elements, required for the optimal growth of Mycobacterium tuberculosis, a major global health pathogen. We found that several proteins jointly contain both domains required for optimal growth and domains that are dispensable. In addition, many non-coding regions, including regulatory elements and non-coding RNAs, are critical for mycobacterial growth. Our analysis shows that the genetic requirements for growth are more complex than can be appreciated using gene-centric analysis.\"\n", + "\n", + "res = translate(query, model='gpt-3.5-turbo')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "EucajnyNY9Qx", + "outputId": "b9faa1c0-409e-40e9-fe21-2ac1b7879b08" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Identifikacija genetskih elemenata neophodnih za održivost je centralna za naše razumevanje osnovne fiziologije bakterijskih patogena. Nedavno su kombinacija visoko-gustinske mutageneze i dubokog sekvenciranja omogućile identifikaciju neophodnih i uslovno neophodnih gena kod mnogih bakterija. Geni, međutim, čine samo deo kompleksnih genoma važnih bakterijskih patogena. Ovde koristimo nepristrasnu analizu kako bismo sveobuhvatno identifikovali genomske regione, uključujući gene, domene i intergenske elemente, neophodne za optimalan rast Mycobacterium tuberculosis, glavnog globalnog zdravstvenog patogena. Otkrili smo da nekoliko proteina zajednički sadrži i domene potrebne za optimalan rast i domene koji su nepotrebni. Pored toga, mnoge nekodirajuće regije, uključujući regulatorne elemente i nekodirajuće RNK, su kritične za mikobakterijski rast. Naša analiza pokazuje da su genetski zahtevi za rast složeniji nego što se može shvatiti korišćenjem analize usmerene na gene.'" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Identifying genomic elements required for viability is central to our understanding of the basic physiology of bacterial pathogens. Recently, the combination of high-density mutagenesis and deep sequencing has allowed for the identification of required and conditionally required genes in many bacteria. Genes, however, make up only a part of the complex genomes of important bacterial pathogens. Here, we use an unbiased analysis to comprehensively identify genomic regions, including genes, domains, and intergenic elements, required for the optimal growth of Mycobacterium tuberculosis, a major global health pathogen. We found that several proteins jointly contain both domains required for optimal growth and domains that are dispensable. In addition, many non-coding regions, including regulatory elements and non-coding RNAs, are critical for mycobacterial growth. Our analysis shows that the genetic requirements for growth are more complex than can be appreciated using gene-centric analysis.\"\n", + "\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "5RAw2bUj-FwZ" + }, + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 196 + }, + "id": "GioJStDOaYzF", + "outputId": "f3f50591-5a37-4f91-fb19-6f2ffcfdc15a" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Neuregulin 1 (NRG1) i njegov receptor ErbB4 su oba gena sklonosti šizofreniji. Međutim, malo se zna o osnovnom mehanizmu njihovog neispravnog funkcionisanja. Iako je ErbB4 obilno prisutan u GABAergičkim interneuronima, uloga NRG1 u formiranju egzitatornih sinapsi kod ovih neurona je slabo razumljiva. Pokazali smo da NRG1 povećava broj i veličinu PSD-95 puncta, frekvenciju i amplitudu minijaturnih EPSC-a (mEPSCs) u GABAergičkim interneuronima, što ukazuje da NRG1 stimuliše formiranje novih sinapsi i jačanje postojećih sinapsi. Nasuprot tome, tretman NRG1 nije imao nikakav uticaj na broj ili veličinu egzitatornih sinapsi u glutamatergičkim neuronima, što ukazuje da je njegov sinaptogeni efekat specifičan za GABAergičke interneurone. Tretman Ecto-ErbB4 je smanjio broj i veličinu egzitatornih sinapsi, što ukazuje da endogeni NRG1 može biti ključan za bazalno formiranje sinapsi. NRG1 bi mogao stimulisati stabilnost PSD-95 na način koji zahteva tirozin kinaznu aktivnost ErbB4. Konačno, brisanje ErbB4 kod interneurona parvalbumina pozitivnih dovelo je do smanjenja frekvencije i amplitude mEPSCs, pružajući in vivo dokaze da je ErbB4 važan u egzitatornom sinaptogenezi kod interneurona. Naša otkrića sugerišu novu sinaptogenu ulogu NRG1 u razvoju egzitatornih sinapsi, moguće putem stabilizacije PSD-95, a ovaj efekat je specifičan za GABAergičke interneurone. U svetlu povezanosti gena NRG1 i ErbB4 sa šizofrenijom i disfunkcijom GABAergičkog sistema kod ove bolesti, ovi rezultati pružaju uvid u njen potencijalni patološki mehanizam.'" + ] + }, + "execution_count": 52, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Neuregulin 1 (NRG1) and its receptor ErbB4 are both susceptibility genes of schizophrenia. However, little is known about the underlying mechanisms of their malfunction. Although ErbB4 is enriched in GABAergic interneurons, the role of NRG1 in excitatory synapse formation in these neurons remains poorly understood. We showed that NRG1 increased both the number and size of PSD-95 puncta and the frequency and amplitude of miniature EPSCs (mEPSCs) in GABAergic interneurons, indicating that NRG1 stimulates the formation of new synapses and strengthens existing synapses. In contrast, NRG1 treatment had no effect on either the number or size of excitatory synapses in glutamatergic neurons, suggesting its synaptogenic effect is specific to GABAergic interneurons. Ecto-ErbB4 treatment diminished both the number and size of excitatory synapses, suggesting that endogenous NRG1 may be critical for basal synapse formation. NRG1 could stimulate the stability of PSD-95 in the manner that requires tyrosine kinase activity of ErbB4. Finally, deletion of ErbB4 in parvalbumin-positive interneurons led to reduced frequency and amplitude of mEPSCs, providing in vivo evidence that ErbB4 is important in excitatory synaptogenesis in interneurons. Together, our findings suggested a novel synaptogenic role of NRG1 in excitatory synapse development, possibly via stabilizing PSD-95, and this effect is specific to GABAergic interneurons. In light of the association of the genes of both NRG1 and ErbB4 with schizophrenia and dysfunction of GABAergic system in this disorder, these results provide insight into its potential pathological mechanism.\"\n", + "res = translate(query, model='gpt-3.5-turbo')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "9_hweOdqagKB", + "outputId": "c410678a-6503-4b9e-c288-906b165e57b9" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Neuregulin 1 (NRG1) i njegov receptor ErbB4 su geni predispozicije za šizofreniju. Međutim, malo se zna o osnovnim mehanizmima njihovog neispravnog rada. Iako je ErbB4 obogaćen u GABAergičkim interneronima, uloga NRG1 u formiranju ekscitatornih sinapsi u ovim neuronima još uvek nije dovoljno shvaćena. Pokazali smo da NRG1 povećava i broj i veličinu PSD-95 punkata, kao i učestalost i amplitudu minijaturnih EPSC-ova (mEPSC-ova) u GABAergičkim interneronima, što ukazuje da NRG1 stimuliše formiranje novih sinapsi i jača postojeće sinapse. Nasuprot tome, tretman NRG1 nije imao efekta na broj ili veličinu ekscitatornih sinapsi u glutamatergičkim neuronima, što sugeriše da je njegov sinaptogeni efekat specifičan za GABAergičke internerone. Tretman Ecto-ErbB4 smanjio je i broj i veličinu ekscitatornih sinapsi, što sugeriše da endogeni NRG1 može biti kritičan za bazalno formiranje sinapsi. NRG1 bi mogao da stimuliše stabilnost PSD-95 na način koji zahteva aktivnost tirozinske kinaze ErbB4. Konačno, delecija ErbB4 u parvalbumin-pozitivnim interneronima dovela je do smanjenja učestalosti i amplitude mEPSC-ova, pružajući in vivo dokaz da je ErbB4 važan u ekscitatornoj sinaptogenezi u interneronima. Zajedno, naši nalazi sugerišu novu sinaptogenu ulogu NRG1 u razvoju ekscitatornih sinapsi, verovatno putem stabilizacije PSD-95, i ovaj efekat je specifičan za GABAergičke internerone. U svetlu povezanosti gena NRG1 i ErbB4 sa šizofrenijom i disfunkcijom GABAergičkog sistema u ovom poremećaju, ovi rezultati pružaju uvid u njegov potencijalni patološki mehanizam.'" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Neuregulin 1 (NRG1) and its receptor ErbB4 are both susceptibility genes of schizophrenia. However, little is known about the underlying mechanisms of their malfunction. Although ErbB4 is enriched in GABAergic interneurons, the role of NRG1 in excitatory synapse formation in these neurons remains poorly understood. We showed that NRG1 increased both the number and size of PSD-95 puncta and the frequency and amplitude of miniature EPSCs (mEPSCs) in GABAergic interneurons, indicating that NRG1 stimulates the formation of new synapses and strengthens existing synapses. In contrast, NRG1 treatment had no effect on either the number or size of excitatory synapses in glutamatergic neurons, suggesting its synaptogenic effect is specific to GABAergic interneurons. Ecto-ErbB4 treatment diminished both the number and size of excitatory synapses, suggesting that endogenous NRG1 may be critical for basal synapse formation. NRG1 could stimulate the stability of PSD-95 in the manner that requires tyrosine kinase activity of ErbB4. Finally, deletion of ErbB4 in parvalbumin-positive interneurons led to reduced frequency and amplitude of mEPSCs, providing in vivo evidence that ErbB4 is important in excitatory synaptogenesis in interneurons. Together, our findings suggested a novel synaptogenic role of NRG1 in excitatory synapse development, possibly via stabilizing PSD-95, and this effect is specific to GABAergic interneurons. In light of the association of the genes of both NRG1 and ErbB4 with schizophrenia and dysfunction of GABAergic system in this disorder, these results provide insight into its potential pathological mechanism.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "5e0cKgADVFRY", + "outputId": "2316f9db-6930-41ed-8682-1d44b1408c5c" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Dugi nekodirajući RNK nuklearni paraspekularni sklopni transkript 1 (NEAT1) je prijavljen da je povećan i da je uključen u onkogeni rast i otpornost na lekove kod karcinoma nosne šupljine (NPC). Međutim, tačne uloge NEAT1 i njeni osnovni mehanizmi u otpornosti na lekove kod NPC-a ostaju uglavnom nejasni. U ovom istraživanju, ekspresije NEAT1, let-72-5p i Rsf-1 mRNA su detektovane reverznom transkripcijom-kvantitativnom polimeraznom lančanom reakcijom (RT-qPCR). Efekti NEAT1 i let-72-5p na proliferaciju ćelija i otpornost na cispaltin NPC ćelija su istraženi metodom 3-(4,5-dimetiltiazol-2-il)-2,5-difeniltetrazolijum bromid (MTT) i metodom 5-etinil-20-dezoksiridin (EdU). Analiza zapadnog blota je izvršena kako bi se detektovali nivoi proteina Rsf-1, Ras, p-Raf1, Raf1, p-MEK1, MEK1, p-ERK1/2 i ERK1/2. Istražen je ksienograftni tumorski test kako bi se razjasnila uloga NEAT1 uključena u rast tumora NPC u vivo. Utvrdili smo da je NEAT1 povećan, a let-7a-5p smanjen u NPC tkivima, kao i NPC ćelijskim linijama. Inhibicija NEAT1 značajno je potisnula otpornost na cispaltin NPC ćelija. Dokazano je da NEAT1 interaguje sa let-7a-5p. Pored toga, negativna korelacija između ekspresije NEAT1 i let-7a-5p je primećena u NPC tkivima. Rsf-1 je potvrđen kao cilj let-7a-5p. NEAT1 je značajno reverzovao inhibicioni efekat let-7q-5p na otpornost na cispaltin NPC ćelija in vitro. Dodatno, suzbijanje NEAT1 inhibiralo je Ras-MAPK putanju u NPC ćelijama. Suzbijanje NEAT1 je suzbilo rast tumora u prisustvu cispaltina in vivo. Uopšteno, ova saznanja sugeriraju da NEAT1/let-7a-5p osovina reguliše otpornost na cispaltin kod NPC-a ciljajući Rsf-1 i modulišući Ras-MAPK signalni put.'" + ] + }, + "execution_count": 63, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"The long non-coding RNA nuclear paraspeckle assembly transcript 1 (NEAT1) was reported to be upregulated and be involved in oncogenic growth and drug resistance in nasopharyngeal carcinoma (NPC). However, the exact roles of NEAT1 and its underlying mechanisms in the drug resistance of NPC remain largely unclear. In this study, the expressions of NEAT1, let-72-5p and Rsf-1 mRNA were detected by reverse transcription-quantitative polymerase chain reaction (RT-qPCR). The effects of NEAT1 and let-72-5p on cell proliferation and cisplatin resistance of NPC cells were investigated by 3-(4,5-dimethylthiazol-2-yl)-2,5-diphenyl tetrazolium bromide (MTT) assay and 5-ethynyl-20-deoxyuridine (EdU) assay. Western blot analysis was performed to detect the protein levels of Rsf-1, Ras, p-Raf1, Raf1, p-MEK1, MEK1, p-ERK1/2 and ERK1/2. Xenograft tumor assay was done to elucidate the role of NEAT1 involved in NPC tumor growth in vivo. We found that NEAT1 was upregulated and let-7a-5p was downregulated in NPC tissues, as well as NPC cell lines. Inhibition of NEAT1 markedly repressed the cisplatin resistance of NPC cells. NEAT1 was demonstrated to interact with let-7a-5p. Besides, a negative correlation between NEAT1 and let-7a-5p expression was observed in NPC tissues. Rsf-1 was confirmed as a target of let-7a-5p. NEAT1 remarkably reversed the inhibitory effect of let-7q-5p on the cisplatin resistance of NPC cells in vitro. Additionally, NEAT1 knockdown inhibited the Ras-MAPK pathway in NPC cells. NEAT1 knockdown suppressed tumor growth in the presence of cisplatin in vivo. Overall, these findings suggest that NEAT1/let-7a-5p axis regulates the cisplatin resistance in NPC by targeting Rsf-1 and modulating the Ras-MAPK signaling pathway.\"\n", + "res = translate(query, model='gpt-3.5-turbo')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "rMiqGfCcbcAc", + "outputId": "f14819b5-51ca-48d9-e2dd-9480bb640ad5" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Duga nekodirajuća RNA nuklearni paraspeckle assembly transcript 1 (NEAT1) je prijavljena kao upregulisana i uključena u onkogeni rast i otpornost na lekove kod nazofaringealnog karcinoma (NPC). Međutim, tačne uloge NEAT1 i njegovi osnovni mehanizmi u otpornosti na lekove kod NPC ostaju uglavnom nejasni. U ovoj studiji, izrazi NEAT1, let-72-5p i Rsf-1 mRNA su detektovani pomoću reverzne transkripcije-kvantitativne lančane reakcije polimeraze (RT-qPCR). Efekti NEAT1 i let-72-5p na proliferaciju ćelija i otpornost na cisplatin kod NPC ćelija su istraženi pomoću 3-(4,5-dimetiltiazol-2-il)-2,5-difenil tetrazolijum bromida (MTT) testa i 5-etinil-20-deoksiuridina (EdU) testa. Western blot analiza je izvedena da se detektuju nivoi proteina Rsf-1, Ras, p-Raf1, Raf1, p-MEK1, MEK1, p-ERK1/2 i ERK1/2. Xenograft tumor test je urađen da se razjasni uloga NEAT1 u rastu tumora NPC in vivo. Otkrili smo da je NEAT1 upregulisan, a let-7a-5p downregulisan u NPC tkivima, kao i u NPC ćelijskim linijama. Inhibicija NEAT1 je značajno potisnula otpornost NPC ćelija na cisplatin. Pokazano je da NEAT1 interaguje sa let-7a-5p. Pored toga, negativna korelacija između ekspresije NEAT1 i let-7a-5p je primećena u NPC tkivima. Rsf-1 je potvrđen kao meta let-7a-5p. NEAT1 je značajno poništio inhibitorni efekat let-7a-5p na otpornost NPC ćelija na cisplatin in vitro. Dodatno, knockdown NEAT1 je inhibirao Ras-MAPK put u NPC ćelijama. Knockdown NEAT1 je suprimirao rast tumora u prisustvu cisplatina in vivo. Sve u svemu, ovi nalazi sugerišu da NEAT1/let-7a-5p osa reguliše otpornost na cisplatin kod NPC ciljajući Rsf-1 i modulišući Ras-MAPK signalni put.'" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"The long non-coding RNA nuclear paraspeckle assembly transcript 1 (NEAT1) was reported to be upregulated and be involved in oncogenic growth and drug resistance in nasopharyngeal carcinoma (NPC). However, the exact roles of NEAT1 and its underlying mechanisms in the drug resistance of NPC remain largely unclear. In this study, the expressions of NEAT1, let-72-5p and Rsf-1 mRNA were detected by reverse transcription-quantitative polymerase chain reaction (RT-qPCR). The effects of NEAT1 and let-72-5p on cell proliferation and cisplatin resistance of NPC cells were investigated by 3-(4,5-dimethylthiazol-2-yl)-2,5-diphenyl tetrazolium bromide (MTT) assay and 5-ethynyl-20-deoxyuridine (EdU) assay. Western blot analysis was performed to detect the protein levels of Rsf-1, Ras, p-Raf1, Raf1, p-MEK1, MEK1, p-ERK1/2 and ERK1/2. Xenograft tumor assay was done to elucidate the role of NEAT1 involved in NPC tumor growth in vivo. We found that NEAT1 was upregulated and let-7a-5p was downregulated in NPC tissues, as well as NPC cell lines. Inhibition of NEAT1 markedly repressed the cisplatin resistance of NPC cells. NEAT1 was demonstrated to interact with let-7a-5p. Besides, a negative correlation between NEAT1 and let-7a-5p expression was observed in NPC tissues. Rsf-1 was confirmed as a target of let-7a-5p. NEAT1 remarkably reversed the inhibitory effect of let-7q-5p on the cisplatin resistance of NPC cells in vitro. Additionally, NEAT1 knockdown inhibited the Ras-MAPK pathway in NPC cells. NEAT1 knockdown suppressed tumor growth in the presence of cisplatin in vivo. Overall, these findings suggest that NEAT1/let-7a-5p axis regulates the cisplatin resistance in NPC by targeting Rsf-1 and modulating the Ras-MAPK signaling pathway.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "7bwd4LKW4w9e", + "outputId": "6b0254b7-32a7-4b67-ff34-69908122fbfe" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Meksiko obiluje velikom kulturnom i etničkom raznolikošću, ali detaljni obrasci varijacija ljudskog genoma na ovoj teritoriji uglavnom nisu karakterisani. Pratili smo genomsku varijabilnost unutar Meksika kod preko 1000 jedinki koje predstavljaju 20 autohtonih i 11 mešanih populacija. Otkrili smo značajnu genetsku stratifikaciju među autohtonim populacijama u Meksiku na različitim stepenima geografske izolacije. Neke grupe su bile toliko diferencirane koliko su Evropljani različiti od Istočnih Azijata. Prekolumbovsku genetsku podstrukturu možemo videti u autohtonom nasleđu mešovitih meksičkih jedinki širom zemlje. Štaviše, dve nezavisno fenotipski određene kohorte Meksikanaca i Meksiko-Amerikanaca pokazale su značajnu asocijaciju između podkontinentalnog nasleđa i funkcije pluća. Stoga je bitno uzeti u obzir detaljne obrasce nasleđa za medicinska i populaciona genetička istraživanja unutar Meksika, kod populacija meksičkog porekla, kao i verovatno kod mnogih drugih populacija širom sveta.'" + ] + }, + "execution_count": 62, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Mexico harbors great cultural and ethnic diversity, yet fine-scale patterns of human genome-wide variation from this region remain largely uncharacterized. We studied genomic variation within Mexico from over 1000 individuals representing 20 indigenous and 11 mestizo populations. We found striking genetic stratification among indigenous populations within Mexico at varying degrees of geographic isolation. Some groups were as differentiated as Europeans are from East Asians. Pre-Columbian genetic substructure is recapitulated in the indigenous ancestry of admixed mestizo individuals across the country. Furthermore, two independently phenotyped cohorts of Mexicans and Mexican Americans showed a significant association between subcontinental ancestry and lung function. Thus, accounting for fine-scale ancestry patterns is critical for medical and population genetic studies within Mexico, in Mexican-descent populations, and likely in many other populations worldwide.\"\n", + "res = translate(query, model='gpt-3.5-turbo')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "pzYDJy_8crUd", + "outputId": "be9811e0-6163-4ba2-a548-32931f44cac9" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Meksiko poseduje veliku kulturnu i etničku raznolikost, ali obrasci varijacija ljudskog genoma na finom nivou iz ovog regiona ostaju uglavnom nekarakterisani. Proučavali smo genetsku varijaciju unutar Meksika kod preko 1000 osoba koje predstavljaju 20 autohtonih i 11 mestizo populacija. Otkrili smo zapanjujuću genetsku stratifikaciju među autohtonim populacijama unutar Meksika u različitim stepenima geografske izolacije. Neke grupe su bile toliko diferencirane koliko su Evropljani različiti od Istočnih Azijata. Prekolumbijska genetska podstruktura se reprizira u autohtonom poreklu mešovitih mestizo osoba širom zemlje. Štaviše, dve nezavisno fenotipizirane kohorte Meksikanaca i Meksikano-Amerikanaca pokazale su značajnu povezanost između supkontinentalnog porekla i funkcije pluća. Dakle, uzimanje u obzir obrazaca porekla na finom nivou je kritično za medicinske i genetske studije populacija unutar Meksika, u populacijama meksičkog porekla, i verovatno u mnogim drugim populacijama širom sveta.'" + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Mexico harbors great cultural and ethnic diversity, yet fine-scale patterns of human genome-wide variation from this region remain largely uncharacterized. We studied genomic variation within Mexico from over 1000 individuals representing 20 indigenous and 11 mestizo populations. We found striking genetic stratification among indigenous populations within Mexico at varying degrees of geographic isolation. Some groups were as differentiated as Europeans are from East Asians. Pre-Columbian genetic substructure is recapitulated in the indigenous ancestry of admixed mestizo individuals across the country. Furthermore, two independently phenotyped cohorts of Mexicans and Mexican Americans showed a significant association between subcontinental ancestry and lung function. Thus, accounting for fine-scale ancestry patterns is critical for medical and population genetic studies within Mexico, in Mexican-descent populations, and likely in many other populations worldwide.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 214 + }, + "id": "NVW8VOXqCi93", + "outputId": "69414f1f-7e2b-423b-fed6-a3e1299738ae" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Rastvorni \"high Km\" 5\\'-nukleotidaza posteljice čoveka je odvojena od \"low Km\" 5\\'-nukleotidaze i nespecifične fosfataze pomoću AMP-Sepharose afinitetne hromatografije. Enzim je pročišćen 8000 puta do specifične aktivnosti od 25.6 mumol/min/mg. Molekulska masa podjedinice je 53 kDa, a molekulska masa u prirodnom stanju je 210 kDa, što sugerira tetramernu strukturu. Rastvorna visoka Km 5\\'-nukleotidaza je najaktivnija sa IMP i GMP i njihovim dezoksi derivatima. IMP se hidrolizuje 15 puta brže od AMP. Enzim ima skoro apsolutnu potrebu za jonskim magnezijumom i regulisan je od strane njih. Purinske nukleozid 5\\'-trifosfati snažno aktiviraju enzim sa redosledom efikasnosti dATP veće od ATP veće od GTP. 2,3-Difosfoglicerat aktivira enzim jednako snažno kao ATP. Tri milimola ATP smanjuju Km za IMP sa 0.33 na 0.09 mM i povećavaju Vmax 12 puta. Aktivacija ATP-om je modifikovana koncentracijom IMP-a. Na 20 mikromola IMP-a, kriva zavisnosti od ATP-a je sigmoidna, dok je na 2 mM IMP-a hiperbolična. A0.5 vrednosti za ATP su 2.26 i 0.70 mM, a relativne maksimalne brzine su 32.9 i 126.0 nmol/min, redom. Anorganski fosfat pomera hiperbolični odnos brzine supstrata za IMP u sigmoidni. Sa fiziološkim koncentracijama koenzima (3 mM ATP, 1-4 mM Pi, 150 mM KCl) na pH 7.4, enzim je 25-35 puta aktivniji prema 100 mikromola IMP-a nego prema 100 mikromola AMP-a. Ovi podaci pokazuju da: (a) rastvorna visoka Km 5\\'-nukleotidaza posteljice čoveka koegzistira u ljudskoj posteljici sa enzimom niske Km; (b) pod fiziološkim uslovima, enzim favorizuje hidrolizu IMP-a i kritično je regulisan od strane IMP-a, ATP-a i Pi nivoa; i (c) kinetičke osobine ATP-a i IMP-a su modifikovane od strane drugog jedinjenja, sugerišući kompleksnu interakciju povezanih vezivnih mesta.'" + ] + }, + "execution_count": 70, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = (\n", + " \"A human placental soluble \\\"high Km\\\" 5'-nucleotidase has been separated from \\\"low Km\\\" 5'-nucleotidase and nonspecific \"\n", + " \"phosphatase by AMP-Sepharose affinity chromatography. The enzyme was purified 8000-fold to a specific activity of 25.6 mumol/min/mg. \"\n", + " \"The subunit molecular mass is 53 kDa, and the native molecular mass is 210 kDa, suggesting a tetrameric structure. Soluble high Km 5'-nucleotidase \"\n", + " \"is most active with IMP and GMP and their deoxy derivatives. IMP is hydrolyzed 15 times faster than AMP. The enzyme has a virtually absolute requirement \"\n", + " \"for magnesium ions and is regulated by them. Purine nucleoside 5'-triphosphates strongly activate the enzyme with the potency order dATP greater than ATP \"\n", + " \"greater than GTP. 2,3-Diphosphoglycerate activates the enzyme as potently as ATP. Three millimolar ATP decreased the Km for IMP from 0.33 to 0.09 mM and \"\n", + " \"increased the Vmax 12-fold. ATP activation was modified by the IMP concentration. At 20 microM IMP the ATP-dependent activation curve was sigmoidal, \"\n", + " \"while at 2 mM IMP it was hyperbolic. The A0.5 values for ATP were 2.26 and 0.70 mM, and the relative maximal velocities were 32.9 and 126.0 nmol/min, \"\n", + " \"respectively. Inorganic phosphate shifts the hyperbolic substrate velocity relationship for IMP to a sigmoidal one. With physiological concentrations of \"\n", + " \"cofactors (3 mM ATP, 1-4 mM Pi, 150 mM KCl) at pH 7.4, the enzyme is 25-35 times more active toward 100 microM IMP than 100 microM AMP. These data show \"\n", + " \"that: (a) soluble human placental high Km 5'-nucleotidase coexists in human placenta with the low Km enzyme; (b) under physiological conditions the enzyme \"\n", + " \"favors the hydrolysis of IMP and is critically regulated by IMP, ATP, and Pi levels; and (c) kinetic properties of ATP and IMP are each modified by the other \"\n", + " \"compound suggesting complex interaction of the associated binding sites.\"\n", + ")\n", + "res = translate(query, model='gpt-3.5-turbo')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "ZeXxvAnKez_q", + "outputId": "35d46aed-bff5-4867-ddaa-af39ff290ef5" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Topiva ljudska placentna rastvorljiva \"visokog Km\" 5\\'-nukleotidaza je odvojena od \"niskog Km\" 5\\'-nukleotidaze i nespecifične fosfataze pomoću AMP-Sepharose afinitetne hromatografije. Enzim je pročišćen 8000 puta do specifične aktivnosti od 25,6 mumol/min/mg. Molekulska masa podjedinica je 53 kDa, a nativna molekulska masa je 210 kDa, što sugeriše tetramernu strukturu. Rastvorljiva visokog Km 5\\'-nukleotidaza je najaktivnija sa IMP i GMP i njihovim deoksi derivatima. IMP se hidrolizuje 15 puta brže od AMP. Enzim ima gotovo apsolutnu potrebu za magnezijumovim jonima i reguliše se njima. Purinski nukleozid 5\\'-trifosfati snažno aktiviraju enzim sa sledećim redosledom potencije: dATP veći od ATP veći od GTP. 2,3-Difosfoglicerat aktivira enzim jednako snažno kao ATP. Tri milimolara ATP smanjuje Km za IMP sa 0,33 na 0,09 mM i povećava Vmax 12 puta. Aktivacija ATP-a je modifikovana koncentracijom IMP. Na 20 mikroM IMP, ATP-zavisna kriva aktivacije je sigmoidna, dok je na 2 mM IMP hiperbolična. A0.5 vrednosti za ATP su 2,26 i 0,70 mM, a relativne maksimalne brzine su 32,9 i 126,0 nmol/min, respektivno. Neorganski fosfat prebacuje hiperboličnu zavisnost brzine supstrata za IMP u sigmoidnu. Sa fiziološkim koncentracijama kofaktora (3 mM ATP, 1-4 mM Pi, 150 mM KCl) na pH 7,4, enzim je 25-35 puta aktivniji prema 100 mikroM IMP nego prema 100 mikroM AMP. Ovi podaci pokazuju da: (a) rastvorljiva ljudska placentna visokog Km 5\\'-nukleotidaza koegzistira u ljudskoj placenti sa enzimom niskog Km; (b) pod fiziološkim uslovima enzim favorizuje hidrolizu IMP i kritično se reguliše nivoima IMP, ATP i Pi; i (c) kinetička svojstva ATP-a i IMP-a su međusobno modifikovana, što sugeriše složenu interakciju povezanih vezivnih mesta.'" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = (\n", + " \"A human placental soluble \\\"high Km\\\" 5'-nucleotidase has been separated from \\\"low Km\\\" 5'-nucleotidase and nonspecific \"\n", + " \"phosphatase by AMP-Sepharose affinity chromatography. The enzyme was purified 8000-fold to a specific activity of 25.6 mumol/min/mg. \"\n", + " \"The subunit molecular mass is 53 kDa, and the native molecular mass is 210 kDa, suggesting a tetrameric structure. Soluble high Km 5'-nucleotidase \"\n", + " \"is most active with IMP and GMP and their deoxy derivatives. IMP is hydrolyzed 15 times faster than AMP. The enzyme has a virtually absolute requirement \"\n", + " \"for magnesium ions and is regulated by them. Purine nucleoside 5'-triphosphates strongly activate the enzyme with the potency order dATP greater than ATP \"\n", + " \"greater than GTP. 2,3-Diphosphoglycerate activates the enzyme as potently as ATP. Three millimolar ATP decreased the Km for IMP from 0.33 to 0.09 mM and \"\n", + " \"increased the Vmax 12-fold. ATP activation was modified by the IMP concentration. At 20 microM IMP the ATP-dependent activation curve was sigmoidal, \"\n", + " \"while at 2 mM IMP it was hyperbolic. The A0.5 values for ATP were 2.26 and 0.70 mM, and the relative maximal velocities were 32.9 and 126.0 nmol/min, \"\n", + " \"respectively. Inorganic phosphate shifts the hyperbolic substrate velocity relationship for IMP to a sigmoidal one. With physiological concentrations of \"\n", + " \"cofactors (3 mM ATP, 1-4 mM Pi, 150 mM KCl) at pH 7.4, the enzyme is 25-35 times more active toward 100 microM IMP than 100 microM AMP. These data show \"\n", + " \"that: (a) soluble human placental high Km 5'-nucleotidase coexists in human placenta with the low Km enzyme; (b) under physiological conditions the enzyme \"\n", + " \"favors the hydrolysis of IMP and is critically regulated by IMP, ATP, and Pi levels; and (c) kinetic properties of ATP and IMP are each modified by the other \"\n", + " \"compound suggesting complex interaction of the associated binding sites.\"\n", + ")\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 107 + }, + "id": "Z4XYY7cQoDRR", + "outputId": "8915b1eb-3a60-417c-d774-f7d577528af4" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "\"NEOZNAČENI MesoRD je alat za stohastičku simulaciju hemijskih reakcija i difuzije. Konkretno, to je implementacija metode sledeće subvolumena, koja je tačna metoda za simulaciju Markovljevog procesa koji odgovara reakcioni-difuzionoj master jednačini. DOSTUPNOST MesoRD je besplatan softver napisan u C++ programskom jeziku i licenciran pod GNU opštom javnom licencom (GPL). MesoRD radi na Linuxu, Mac OS X-u, NetBSD-u, Solarisu i Windows XP-u. Može se preuzeti sa http://mesord.sourceforge.net. KONTAKT johan.elf@icm.uu.se; johan.hattne@embl-hamburg.de DODATNE INFORMACIJE 'MesoRD Vodič za korisnike' i drugi dokumenti su dostupni na http://mesord.sourceforge.net.\"" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = (\n", + " \"UNLABELLED MesoRD is a tool for stochastic simulation of chemical reactions and diffusion. \"\n", + " \"In particular, it is an implementation of the next subvolume method, which is an exact method to simulate the Markov process corresponding to the reaction-diffusion master equation. \"\n", + " \"AVAILABILITY MesoRD is free software, written in C++ and licensed under the GNU general public license (GPL). \"\n", + " \"MesoRD runs on Linux, Mac OS X, NetBSD, Solaris and Windows XP. It can be downloaded from http://mesord.sourceforge.net. \"\n", + " \"CONTACT johan.elf@icm.uu.se; johan.hattne@embl-hamburg.de \"\n", + " \"SUPPLEMENTARY INFORMATION 'MesoRD User's Guide' and other documents are available at http://mesord.sourceforge.net.\"\n", + ")\n", + "res = translate(query, model='gpt-3.5-turbo')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 107 + }, + "id": "R1G_9CfflNGR", + "outputId": "b819df75-0a22-4938-f51e-045133be73fe" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "\"NEOZNAČENO MesoRD je alat za stohastičku simulaciju hemijskih reakcija i difuzije. Konkretno, to je implementacija metode sledećeg podzapreminskog pristupa, koja je tačna metoda za simulaciju Markovljevog procesa koji odgovara glavnoj jednačini reakcije-difuzije. DOSTUPNOST MesoRD je besplatan softver, napisan u C++ i licenciran pod GNU opštom javnom licencom (GPL). MesoRD radi na Linux-u, Mac OS X, NetBSD, Solaris-u i Windows XP-u. Može se preuzeti sa http://mesord.sourceforge.net. KONTAKT johan.elf@icm.uu.se; johan.hattne@embl-hamburg.de DODATNE INFORMACIJE 'MesoRD Korisnički vodič' i drugi dokumenti dostupni su na http://mesord.sourceforge.net.\"" + ] + }, + "execution_count": 35, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = (\n", + " \"UNLABELLED MesoRD is a tool for stochastic simulation of chemical reactions and diffusion. \"\n", + " \"In particular, it is an implementation of the next subvolume method, which is an exact method to simulate the Markov process corresponding to the reaction-diffusion master equation. \"\n", + " \"AVAILABILITY MesoRD is free software, written in C++ and licensed under the GNU general public license (GPL). \"\n", + " \"MesoRD runs on Linux, Mac OS X, NetBSD, Solaris and Windows XP. It can be downloaded from http://mesord.sourceforge.net. \"\n", + " \"CONTACT johan.elf@icm.uu.se; johan.hattne@embl-hamburg.de \"\n", + " \"SUPPLEMENTARY INFORMATION 'MesoRD User's Guide' and other documents are available at http://mesord.sourceforge.net.\"\n", + ")\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 232 + }, + "id": "jyUqdDNOsqjP", + "outputId": "49c3f708-4bf7-48b2-e149-9e70f9f4897e" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'POZADINA Epidemiološka analiza porodičnih podataka o krvnom pritisku (KP) često je ugrožena efektima antihipertenzivnih lekova. Pregled brojnih kliničkih ispitivanja koja su istraživala efekte lekova za snižavanje KP je ovde sažet. METODE Pregledana su objavljena klinička ispitivanja, uključujući 137 kliničkih ispitivanja sa monoterapijama i 28 kliničkih ispitivanja kombinovanih terapija sa ukupno 11,739 učesnika, iz PubMed-a. Šest glavnih klasa/grupa antihipertenzivnih lekova svrstano je prema etničkoj pripadnosti, uključujući inhibitore enzima koji konvertuje angiotenzin (ACE), alfa1-blokatore, kardioselektivne beta-blokatore (beta1-blokatore), blokatore kalcijumskih kanala, tiazidne i tiazidima slične diuretike, i diuretike Henleove petlje. REZULTATI Koristeći sedeći ili ležeći KP, za kombinovane etničke grupe, monoterapija sa ACE inhibitorima pokazala je ponderisani prosečan efekat snižavanja sistolnog i dijastolnog KP za 12.5/9.5 mm Hg; alfa1-blokatori za 15.5/11.7 mm Hg; beta1-blokatori za 14.8/12.2 mm Hg; blokatori kalcijumskih kanala za 15.3/10.5 mm Hg; tiazidni diuretici za 15.3/9.8 mm Hg; i diuretici Henleove petlje za 15.8/8.2 mm Hg. Međutim, ACE inhibitori, alfa1-blokatori i beta1-blokatori su bili manje efikasni kod Afroamerikanaca nego kod ne-Afroamerikanaca, dok su blokatori kalcijumskih kanala, tiazidni diuretici i diuretici Henleove petlje bili efikasniji kod Afroamerikanaca nego kod ne-Afroamerikanaca. Za kombinovanu terapiju sa dva leka kod kombinovanih etničkih grupa, efekat snižavanja KP kod drugog leka, u poređenju sa njegovim efektom kao monoterapije, bio je 84% i 65% za sistolni i dijastolni KP, respektivno. ZAKLJUČCI Efekti snižavanja KP navedeni ovde mogu se koristiti za imputaciju nivoa KP pre tretmana, što može poboljšati sadržaj informacija i time snagu epidemiološke analize u studijama gde je upotreba antihipertenzivnih lekova zbunjujući faktor u merenjima KP.'" + ] + }, + "execution_count": 24, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"BACKGROUND Epidemiologic analysis of family data on blood pressure (BP) is often compromised by the effects of antihypertensive medications. A review of numerous clinical trials that investigated the effects of BP-lowering medications is summarized here. METHODS Published clinical trials, including 137 clinical trials with monodrug therapies and 28 clinical trials of combination drug therapies with a total of 11,739 participants, were reviewed from PubMed. Six major classes/groups of antihypertensive medications were categorized by ethnicity, including angiotensin-converting enzyme (ACE) inhibitors, alpha1-blockers, cardioselective beta-blockers (beta1-blockers), calcium channel blockers, thiazide and thiazide-like diuretics, and loop diuretics. RESULTS Using sitting or supine BP, for ethnic groups combined, monodrug therapy with ACE inhibitors showed a weighted average effect of lowering the systolic and diastolic BP by 12.5/9.5 mm Hg; alpha1-blockers by 15.5/11.7 mm Hg; beta1-blockers by 14.8/12.2 mm Hg; calcium channel blockers by 15.3/10.5 mm Hg; thiazide diuretics by 15.3/9.8 mm Hg; and loop diuretics by 15.8/8.2 mm Hg. However, ACE inhibitors, alpha1-blockers, and beta1-blockers were less effective in African Americans than in non-African Americans, whereas calcium channel blockers, thiazide diuretics, and loop diuretics were more effective in African Americans than in non-African Americans. For two-drug combination therapy with ethnic groups combined, the BP-lowering effect of the second medication, when compared to its effect as monodrug therapy, was 84% and 65% for systolic and diastolic BP, respectively. CONCLUSIONS The BP-lowering effects reported here may be used to impute the pretreatment BP levels, which can improve the information content and hence the power of epidemiologic analysis in studies where use of antihypertensive medications is a confounding factor in the BP measurements.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 143 + }, + "id": "sv7xxuwdisRv", + "outputId": "047e74c1-c056-4c9c-cf33-6299628e57e1" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Kompleks COMPASS koji sadrži Set1, a koji je kvasčev homolog ljudskog MLL kompleksa, potreban je za mono-, di- i trimetilaciju lizina 4 histona H3. Izvršili smo komparativni globalni proteomski skrining kako bismo bolje definisali ulogu kompleksa COMPASS u trimetilaciji histona. Izveštavamo da su i komponente Cps60 i Cps40 kompleksa COMPASS potrebne za pravilnu trimetilaciju histona H3, ali ne i za pravilnu regulaciju ćutanja gena povezanih sa telomerima. Pročišćeni kompleks COMPASS koji nedostaje Cps60 može vršiti mono- i dimetilaciju, ali nije sposoban za trimetilaciju H3(K4). Studije imunoprecipitacije hromatina (ChIP) ukazuju na to da gubitak podjedinica kompleksa COMPASS koje su potrebne za trimetilaciju histona ne utiče na lokalizaciju Set1 na hromatin za testirane gene. Zajedno, naši rezultati sugerišu molekularnu potrebu za nekoliko komponenti kompleksa COMPASS za pravilnu trimetilaciju histona H3 i regulaciju ekspresije gena povezanih sa telomerima, ukazujući na višestruke uloge različitih oblika metilacije histona od strane kompleksa COMPASS.'" + ] + }, + "execution_count": 25, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"The Set1-containing complex COMPASS, which is the yeast homolog of the human MLL complex, is required for mono-, di-, and trimethylation of lysine 4 of histone H3. We have performed a comparative global proteomic screen to better define the role of COMPASS in histone trimethylation. We report that both Cps60 and Cps40 components of COMPASS are required for proper histone H3 trimethylation, but not for proper regulation of telomere-associated gene silencing. Purified COMPASS lacking Cps60 can mono- and dimethylate but is not capable of trimethylating H3(K4). Chromatin immunoprecipitation (ChIP) studies indicate that the loss subunits of COMPASS required for histone trimethylation do not affect the localization of Set1 to chromatin for the genes tested. Collectively, our results suggest a molecular requirement for several components of COMPASS for proper histone H3 trimethylation and regulation of telomere-associated gene expression, indicating multiple roles for different forms of histone methylation by COMPASS.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 89 + }, + "id": "00HbxY-GjGF4", + "outputId": "382955c5-d11f-4313-e8c0-e9bb82c52560" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "'Izveštavamo o jednostavnom metodu, koristeći supresiju p53 i netransformišući L-Myc, za generisanje ljudskih indukovanih pluripotentnih matičnih ćelija (iPSCs) sa epizomalnim plazmidnim vektorima. Generisali smo ljudske iPSCs od više donora, uključujući dva pretpostavljena donora homozigotna za ljudski leukocitni antigen (HLA), koji odgovaraju ∼20% japanske populacije na glavnim HLA lokusima; većina iPSCs su bez integrisanih transgena. Ovaj metod može obezbediti iPSCs pogodne za autologne i alologne terapije matičnim ćelijama u budućnosti.'" + ] + }, + "execution_count": 26, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"We report a simple method, using p53 suppression and nontransforming L-Myc, to generate human induced pluripotent stem cells (iPSCs) with episomal plasmid vectors. We generated human iPSCs from multiple donors, including two putative human leukocyte antigen (HLA)-homozygous donors who match ∼20% of the Japanese population at major HLA loci; most iPSCs are integrated transgene-free. This method may provide iPSCs suitable for autologous and allologous stem-cell therapy in the future.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 125 + }, + "id": "oqYWm1FHkJsC", + "outputId": "73087a70-1f85-4df0-ad44-679e480bdeec" + }, + "outputs": [ + { + "data": { + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "string" + }, + "text/plain": [ + "\"Imunološko pamćenje je kardinalna karakteristika adaptivnog imuniteta i važan cilj vakcinacionih strategija. Ovde ističemo napredak u razumevanju različitih podskupina T limfocita koje pružaju akutnu i dugoročnu zaštitu od infekcija. Ovo uključuje nove uvide u transkripcione faktore i uzvodne 'pionirske' faktore koji regulišu njihovu dostupnost ključnim mestima regulacije gena, kao i metaboličke regulatore koji doprinose diferencijaciji efektorskih i memorijskih podskupina; ontogenezu i definisanje karakteristika tkivno-rezidentnih memorijskih limfocita; i poreklo izuzetne heterogenosti koju ispoljavaju aktivirani T ćelije. Kolektivno, ovi nalazi naglašavaju napredak u razjašnjavanju osnovnih puteva koji kontrolišu diverzifikaciju odgovora T ćelija, ali takođe otkrivaju praznine u znanju, kao i izazove koji se javljaju u primeni ovog znanja kako bi se racionalno izazvali željeni odgovori T ćelija putem vakcinacije i imunoterapije.\"" + ] + }, + "execution_count": 36, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "query = \"Immunological memory is a cardinal feature of adaptive immunity and an important goal of vaccination strategies. Here we highlight advances in the understanding of the diverse T lymphocyte subsets that provide acute and long-term protection from infection. These include new insights into the transcription factors, and the upstream 'pioneering' factors that regulate their accessibility to key sites of gene regulation, as well as metabolic regulators that contribute to the differentiation of effector and memory subsets; ontogeny and defining characteristics of tissue-resident memory lymphocytes; and origins of the remarkable heterogeneity exhibited by activated T cells. Collectively, these findings underscore progress in delineating the underlying pathways that control diversification in T cell responses but also reveal gaps in the knowledge, as well as the challenges that arise in the application of this knowledge to rationally elicit desired T cell responses through vaccination and immunotherapy.\"\n", + "res = translate(query, model='gpt-4o')\n", + "res.choices[0].message.content" + ] + } + ], + "metadata": { + "colab": { + "provenance": [] + }, + "kernelspec": { + "display_name": "Python (myenv)", + "language": "python", + "name": "myenv" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12.2" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +}