Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Revamped Jupyter AI #1

Closed
wants to merge 1 commit into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
124 changes: 124 additions & 0 deletions packages/jupyter-ai-magics/jupyter_ai_magics/prompts.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,124 @@
CHAT_SYSTEM_PROMPT = """
You are Jupyternaut, a conversational assistant living in JupyterLab to help users.
You are an expert in Jupyter Notebook, Data Visualization, Data Science and Data Analysis.
You always use Markdown to format your response.
Code blocks must be formatted in Markdown.
Math should be rendered with inline TeX markup, surrounded by $.
If you do not know the answer to a question, answer truthfully by responding that you do not know.
The following is a friendly conversation between you and a human.
""".strip()

CHAT_DEFAULT_TEMPLATE = """
<context>
{% if notebook_code %}
Below is a Jupyter notebook, in jupytext "percent" format that the Human is working with:
<notebook-code>
{{notebook_code}}
</notebook-code>
{% endif %}
{% if active_cell_id %}
The following cell is selected currently by the user: {{active_cell_id}}
{% endif %}
{% if selection and selection.type == 'text' %}
The following code is selected by the user in the active cell:
<selected-code>
{{selection.source}}
</selected-code>
{% endif %}
{% if variable_context %}
The kernel is currently running with some of the global variables and their values/types listed below:
{{variable_context}}
{% endif %}
</context>
Unless asked otherwise, answer all questions as concisely and directly as possible.
That is, you directly output code, when asked, with minimal explanation.
Avoid writing cell ids or too many comments in the code.
"""

COMPLETION_SYSTEM_PROMPT = """
You are a python coding assistant capable of completing code.
You should only produce code. Avoid comments in the code. Produce clean code.
The code is written in JupyterLab, a data analysis and code development
environment which can execute code extended with additional syntax for
interactive features, such as magics.

Here are some examples of Python code completion:

Example 1:
Input:
def calculate_area(radius):
return 3.14 * [BLANK]

Output:
radius ** 2

Example 2:
Input:
for i in range(10):
if i % 2 == 0:
[BLANK]

Output:
print(i)

Example 3:
Input:
try:
result = 10 / 0
except [BLANK]:
print("Division by zero!")

Output:
ZeroDivisionError

Example 4:
Input:
import random

numbers = [1, 2, 3, 4, 5]
random[BLANK]

Output:
.shuffle(numbers)

Example 5:
Input:
def quick_sort(arr):
# exp[BLANK]

Output:
lanation:

Example 6:
Input:
import pandas as pd
import numpy as np

def create_random_dataframe(arr):
[BLANK]

Output:
return pd.DataFrame(arr, columns=["column1", "column2"])

Example 7:
Input:
def get_params():
return (1, 2)

x, y[BLANK]

print(x + y)

Output:
= get_params()
""".strip()

# only add the suffix bit if present to save input tokens/computation time
COMPLETION_DEFAULT_TEMPLATE = """
Now, complete the following Python code being written in {{filename}}:

{{prefix}}[BLANK]{{suffix}}

Fill in the blank to complete the code block.
Your response should include only the code to replace [BLANK], without surrounding backticks.
Do not return a linebreak at the beginning of your response."""
94 changes: 22 additions & 72 deletions packages/jupyter-ai-magics/jupyter_ai_magics/providers.py
Original file line number Diff line number Diff line change
Expand Up @@ -49,66 +49,7 @@
InlineCompletionStreamChunk,
)
from .models.persona import Persona

CHAT_SYSTEM_PROMPT = """
You are Jupyternaut, a conversational assistant living in JupyterLab to help users.
You are not a language model, but rather an application built on a foundation model from {provider_name} called {local_model_id}.
You are talkative and you provide lots of specific details from the foundation model's context.
You may use Markdown to format your response.
If your response includes code, they must be enclosed in Markdown fenced code blocks (with triple backticks before and after).
If your response includes mathematical notation, they must be expressed in LaTeX markup and enclosed in LaTeX delimiters.
All dollar quantities (of USD) must be formatted in LaTeX, with the `$` symbol escaped by a single backslash `\\`.
- Example prompt: `If I have \\\\$100 and spend \\\\$20, how much money do I have left?`
- **Correct** response: `You have \\(\\$80\\) remaining.`
- **Incorrect** response: `You have $80 remaining.`
If you do not know the answer to a question, answer truthfully by responding that you do not know.
The following is a friendly conversation between you and a human.
""".strip()

CHAT_DEFAULT_TEMPLATE = """
{% if context %}
Context:
{{context}}

{% endif %}
Current conversation:
{{history}}
Human: {{input}}
AI:"""

HUMAN_MESSAGE_TEMPLATE = """
{% if context %}
Context:
{{context}}

{% endif %}
{{input}}
"""

COMPLETION_SYSTEM_PROMPT = """
You are an application built to provide helpful code completion suggestions.
You should only produce code. Keep comments to minimum, use the
programming language comment syntax. Produce clean code.
The code is written in JupyterLab, a data analysis and code development
environment which can execute code extended with additional syntax for
interactive features, such as magics.
""".strip()

# only add the suffix bit if present to save input tokens/computation time
COMPLETION_DEFAULT_TEMPLATE = """
The document is called `{{filename}}` and written in {{language}}.
{% if suffix %}
The code after the completion request is:

```
{{suffix}}
```
{% endif %}

Complete the following code:

```
{{prefix}}"""
from .prompts import CHAT_DEFAULT_TEMPLATE, CHAT_SYSTEM_PROMPT, COMPLETION_DEFAULT_TEMPLATE, COMPLETION_SYSTEM_PROMPT


class EnvAuthStrategy(BaseModel):
Expand Down Expand Up @@ -215,7 +156,6 @@ def server_settings(cls, value):

_server_settings = None


class BaseProvider(BaseModel, metaclass=ProviderMetaclass):
#
# pydantic config
Expand Down Expand Up @@ -291,6 +231,11 @@ class Config:
Providers are not allowed to mutate this dictionary.
"""

chat_system_prompt: str = CHAT_SYSTEM_PROMPT
chat_default_prompt: str = CHAT_DEFAULT_TEMPLATE
completion_system_prompt: str = COMPLETION_SYSTEM_PROMPT
completion_default_prompt: str = COMPLETION_DEFAULT_TEMPLATE

@classmethod
def chat_models(self):
"""Models which are suitable for chat."""
Expand Down Expand Up @@ -353,6 +298,9 @@ def __init__(self, *args, **kwargs):
}
super().__init__(*args, **kwargs, **model_kwargs)

def process_notebook_for_context(self, code_cells: List[str], active_cell: Optional[int]) -> str:
return "\n\n".join(code_cells)

async def _call_in_executor(self, *args, **kwargs) -> Coroutine[Any, Any, str]:
"""
Calls self._call() asynchronously in a separate thread for providers
Expand Down Expand Up @@ -409,23 +357,25 @@ def get_chat_prompt_template(self) -> PromptTemplate:
return ChatPromptTemplate.from_messages(
[
SystemMessagePromptTemplate.from_template(
CHAT_SYSTEM_PROMPT
).format(provider_name=name, local_model_id=self.model_id),
MessagesPlaceholder(variable_name="history"),
self.chat_system_prompt,
template_format="jinja2"
),
HumanMessagePromptTemplate.from_template(
HUMAN_MESSAGE_TEMPLATE,
template_format="jinja2",
self.chat_default_prompt,
template_format="jinja2"
),
MessagesPlaceholder(variable_name="history"),
HumanMessagePromptTemplate.from_template("{input}"),
]
)
else:
return PromptTemplate(
input_variables=["history", "input", "context"],
template=CHAT_SYSTEM_PROMPT.format(
template=self.chat_system_prompt.format(
provider_name=name, local_model_id=self.model_id
)
+ "\n\n"
+ CHAT_DEFAULT_TEMPLATE,
+ self.chat_default_prompt,
template_format="jinja2",
)

Expand All @@ -437,18 +387,18 @@ def get_completion_prompt_template(self) -> PromptTemplate:
if self.is_chat_provider:
return ChatPromptTemplate.from_messages(
[
SystemMessagePromptTemplate.from_template(COMPLETION_SYSTEM_PROMPT),
SystemMessagePromptTemplate.from_template(self.completion_system_prompt),
HumanMessagePromptTemplate.from_template(
COMPLETION_DEFAULT_TEMPLATE, template_format="jinja2"
self.completion_default_prompt, template_format="jinja2"
),
]
)
else:
return PromptTemplate(
input_variables=["prefix", "suffix", "language", "filename"],
template=COMPLETION_SYSTEM_PROMPT
template=self.completion_default_prompt
+ "\n\n"
+ COMPLETION_DEFAULT_TEMPLATE,
+ self.completion_default_prompt,
template_format="jinja2",
)

Expand Down
Loading