segments.py 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157
  1. import json
  2. import sys
  3. from collections.abc import Mapping, Sequence
  4. from typing import Any
  5. from pydantic import BaseModel, ConfigDict, field_validator
  6. from core.file import File
  7. from .types import SegmentType
  8. class Segment(BaseModel):
  9. model_config = ConfigDict(frozen=True)
  10. value_type: SegmentType
  11. value: Any
  12. @field_validator("value_type")
  13. @classmethod
  14. def validate_value_type(cls, value):
  15. """
  16. This validator checks if the provided value is equal to the default value of the 'value_type' field.
  17. If the value is different, a ValueError is raised.
  18. """
  19. if value != cls.model_fields["value_type"].default:
  20. raise ValueError("Cannot modify 'value_type'")
  21. return value
  22. @property
  23. def text(self) -> str:
  24. return str(self.value)
  25. @property
  26. def log(self) -> str:
  27. return str(self.value)
  28. @property
  29. def markdown(self) -> str:
  30. return str(self.value)
  31. @property
  32. def size(self) -> int:
  33. """
  34. Return the size of the value in bytes.
  35. """
  36. return sys.getsizeof(self.value)
  37. def to_object(self) -> Any:
  38. return self.value
  39. class NoneSegment(Segment):
  40. value_type: SegmentType = SegmentType.NONE
  41. value: None = None
  42. @property
  43. def text(self) -> str:
  44. return ""
  45. @property
  46. def log(self) -> str:
  47. return ""
  48. @property
  49. def markdown(self) -> str:
  50. return ""
  51. class StringSegment(Segment):
  52. value_type: SegmentType = SegmentType.STRING
  53. value: str
  54. class FloatSegment(Segment):
  55. value_type: SegmentType = SegmentType.NUMBER
  56. value: float
  57. class IntegerSegment(Segment):
  58. value_type: SegmentType = SegmentType.NUMBER
  59. value: int
  60. class ObjectSegment(Segment):
  61. value_type: SegmentType = SegmentType.OBJECT
  62. value: Mapping[str, Any]
  63. @property
  64. def text(self) -> str:
  65. return json.dumps(self.model_dump()["value"], ensure_ascii=False)
  66. @property
  67. def log(self) -> str:
  68. return json.dumps(self.model_dump()["value"], ensure_ascii=False, indent=2)
  69. @property
  70. def markdown(self) -> str:
  71. return json.dumps(self.model_dump()["value"], ensure_ascii=False, indent=2)
  72. class ArraySegment(Segment):
  73. @property
  74. def markdown(self) -> str:
  75. items = []
  76. for item in self.value:
  77. items.append(str(item))
  78. return "\n".join(items)
  79. class FileSegment(Segment):
  80. value_type: SegmentType = SegmentType.FILE
  81. value: File
  82. @property
  83. def markdown(self) -> str:
  84. return self.value.markdown
  85. @property
  86. def log(self) -> str:
  87. return str(self.value)
  88. @property
  89. def text(self) -> str:
  90. return str(self.value)
  91. class ArrayAnySegment(ArraySegment):
  92. value_type: SegmentType = SegmentType.ARRAY_ANY
  93. value: Sequence[Any]
  94. class ArrayStringSegment(ArraySegment):
  95. value_type: SegmentType = SegmentType.ARRAY_STRING
  96. value: Sequence[str]
  97. class ArrayNumberSegment(ArraySegment):
  98. value_type: SegmentType = SegmentType.ARRAY_NUMBER
  99. value: Sequence[float | int]
  100. class ArrayObjectSegment(ArraySegment):
  101. value_type: SegmentType = SegmentType.ARRAY_OBJECT
  102. value: Sequence[Mapping[str, Any]]
  103. class ArrayFileSegment(ArraySegment):
  104. value_type: SegmentType = SegmentType.ARRAY_FILE
  105. value: Sequence[File]
  106. @property
  107. def markdown(self) -> str:
  108. items = []
  109. for item in self.value:
  110. items.append(item.markdown)
  111. return "\n".join(items)