mirror of
https://github.com/infiniflow/ragflow.git
synced 2025-12-08 12:32:30 +08:00
### What problem does this PR solve? Add Jira connector. <img width="978" height="925" alt="image" src="https://github.com/user-attachments/assets/78bb5c77-2710-4569-a76e-9087ca23b227" /> --- <img width="1903" height="489" alt="image" src="https://github.com/user-attachments/assets/193bc5c5-f751-4bd5-883a-2173282c2b96" /> --- <img width="1035" height="925" alt="image" src="https://github.com/user-attachments/assets/1a0aec19-30eb-4ada-9283-61d1c915f59d" /> --- <img width="1905" height="601" alt="image" src="https://github.com/user-attachments/assets/3dde1062-3f27-4717-8e09-fd5fd5e64171" /> ### Type of change - [x] New Feature (non-breaking change which adds functionality)
150 lines
4.7 KiB
Python
150 lines
4.7 KiB
Python
"""Helper utilities for the Jira connector."""
|
|
|
|
from __future__ import annotations
|
|
|
|
import os
|
|
from collections.abc import Collection
|
|
from datetime import datetime, timezone
|
|
from typing import Any, Iterable
|
|
|
|
from jira.resources import Issue
|
|
|
|
from common.data_source.utils import datetime_from_string
|
|
|
|
JIRA_SERVER_API_VERSION = os.environ.get("JIRA_SERVER_API_VERSION", "2")
|
|
JIRA_CLOUD_API_VERSION = os.environ.get("JIRA_CLOUD_API_VERSION", "3")
|
|
|
|
|
|
def build_issue_url(base_url: str, issue_key: str) -> str:
|
|
"""Return the canonical UI URL for a Jira issue."""
|
|
return f"{base_url.rstrip('/')}/browse/{issue_key}"
|
|
|
|
|
|
def parse_jira_datetime(value: Any) -> datetime | None:
|
|
"""Best-effort parse of Jira datetime values to aware UTC datetimes."""
|
|
if value is None:
|
|
return None
|
|
if isinstance(value, datetime):
|
|
return value.astimezone(timezone.utc) if value.tzinfo else value.replace(tzinfo=timezone.utc)
|
|
if isinstance(value, str):
|
|
return datetime_from_string(value)
|
|
return None
|
|
|
|
|
|
def extract_named_value(value: Any) -> str | None:
|
|
"""Extract a readable string out of Jira's typed objects."""
|
|
if value is None:
|
|
return None
|
|
if isinstance(value, str):
|
|
return value
|
|
if isinstance(value, dict):
|
|
return value.get("name") or value.get("value")
|
|
return getattr(value, "name", None)
|
|
|
|
|
|
def extract_user(value: Any) -> tuple[str | None, str | None]:
|
|
"""Return display name + email tuple for a Jira user blob."""
|
|
if value is None:
|
|
return None, None
|
|
if isinstance(value, dict):
|
|
return value.get("displayName"), value.get("emailAddress")
|
|
|
|
display = getattr(value, "displayName", None)
|
|
email = getattr(value, "emailAddress", None)
|
|
return display, email
|
|
|
|
|
|
def extract_text_from_adf(adf: Any) -> str:
|
|
"""Flatten Atlassian Document Format (ADF) structures to text."""
|
|
texts: list[str] = []
|
|
|
|
def _walk(node: Any) -> None:
|
|
if node is None:
|
|
return
|
|
if isinstance(node, dict):
|
|
node_type = node.get("type")
|
|
if node_type == "text":
|
|
texts.append(node.get("text", ""))
|
|
for child in node.get("content", []):
|
|
_walk(child)
|
|
elif isinstance(node, list):
|
|
for child in node:
|
|
_walk(child)
|
|
|
|
_walk(adf)
|
|
return "\n".join(part for part in texts if part)
|
|
|
|
|
|
def extract_body_text(value: Any) -> str:
|
|
"""Normalize Jira description/comments (raw/adf/str) into plain text."""
|
|
if value is None:
|
|
return ""
|
|
if isinstance(value, str):
|
|
return value.strip()
|
|
if isinstance(value, dict):
|
|
return extract_text_from_adf(value).strip()
|
|
return str(value).strip()
|
|
|
|
|
|
def format_comments(
|
|
comment_block: Any,
|
|
*,
|
|
blacklist: Collection[str],
|
|
) -> str:
|
|
"""Convert Jira comments into a markdown-ish bullet list."""
|
|
if not isinstance(comment_block, dict):
|
|
return ""
|
|
|
|
comments = comment_block.get("comments") or []
|
|
lines: list[str] = []
|
|
normalized_blacklist = {email.lower() for email in blacklist if email}
|
|
|
|
for comment in comments:
|
|
author = comment.get("author") or {}
|
|
author_email = (author.get("emailAddress") or "").lower()
|
|
if author_email and author_email in normalized_blacklist:
|
|
continue
|
|
|
|
author_name = author.get("displayName") or author.get("name") or author_email or "Unknown"
|
|
created = parse_jira_datetime(comment.get("created"))
|
|
created_str = created.isoformat() if created else "Unknown time"
|
|
body = extract_body_text(comment.get("body"))
|
|
if not body:
|
|
continue
|
|
|
|
lines.append(f"- {author_name} ({created_str}):\n{body}")
|
|
|
|
return "\n\n".join(lines)
|
|
|
|
|
|
def format_attachments(attachments: Any) -> str:
|
|
"""List Jira attachments as bullet points."""
|
|
if not isinstance(attachments, list):
|
|
return ""
|
|
|
|
attachment_lines: list[str] = []
|
|
for attachment in attachments:
|
|
filename = attachment.get("filename")
|
|
if not filename:
|
|
continue
|
|
size = attachment.get("size")
|
|
size_text = f" ({size} bytes)" if isinstance(size, int) else ""
|
|
content_url = attachment.get("content") or ""
|
|
url_suffix = f" -> {content_url}" if content_url else ""
|
|
attachment_lines.append(f"- {filename}{size_text}{url_suffix}")
|
|
|
|
return "\n".join(attachment_lines)
|
|
|
|
|
|
def should_skip_issue(issue: Issue, labels_to_skip: set[str]) -> bool:
|
|
"""Return True if the issue contains any label from the skip list."""
|
|
if not labels_to_skip:
|
|
return False
|
|
|
|
fields = getattr(issue, "raw", {}).get("fields", {})
|
|
labels: Iterable[str] = fields.get("labels") or []
|
|
for label in labels:
|
|
if (label or "").lower() in labels_to_skip:
|
|
return True
|
|
return False
|