-
Notifications
You must be signed in to change notification settings - Fork 1.2k
Expand file tree
/
Copy pathtest_streaming_fidelity_e2e.py
More file actions
188 lines (146 loc) · 7.19 KB
/
test_streaming_fidelity_e2e.py
File metadata and controls
188 lines (146 loc) · 7.19 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
"""E2E Streaming Fidelity Tests"""
import os
import pytest
from copilot import CopilotClient, RuntimeConnection
from copilot.session import PermissionHandler
from .testharness import E2ETestContext
# Mark every test in this module as asyncio, using a module-scoped event loop.
pytestmark = pytest.mark.asyncio(loop_scope="module")
# Event type names compared against ``event.type.value`` throughout the tests.
_DELTA_EVENT = "assistant.message_delta"
_MESSAGE_EVENT = "assistant.message"


def _events_of_type(events, event_type):
    """Return the events whose ``type.value`` equals *event_type*, in order."""
    return [e for e in events if e.type.value == event_type]


def _assert_deltas_have_content(delta_events):
    """Assert that every delta event carries a string ``delta_content``."""
    for delta in delta_events:
        delta_content = getattr(delta.data, "delta_content", None)
        assert delta_content is not None
        assert isinstance(delta_content, str)


def _new_client(ctx: E2ETestContext) -> CopilotClient:
    """Build a second stdio client that mirrors the context's configuration.

    A placeholder token is supplied only when ``GITHUB_ACTIONS`` is ``"true"``;
    otherwise no explicit token is passed.
    """
    github_token = (
        "fake-token-for-e2e-tests" if os.environ.get("GITHUB_ACTIONS") == "true" else None
    )
    return CopilotClient(
        connection=RuntimeConnection.for_stdio(path=ctx.cli_path),
        working_directory=ctx.work_dir,
        env=ctx.get_env(),
        github_token=github_token,
    )


class TestStreamingFidelity:
    """E2E checks that the ``streaming`` option controls delta event emission."""

    async def test_should_produce_delta_events_when_streaming_is_enabled(self, ctx: E2ETestContext):
        """streaming=True yields string deltas, the first one before the last final message."""
        session = await ctx.client.create_session(
            on_permission_request=PermissionHandler.approve_all, streaming=True
        )
        # Disconnect in ``finally`` so a failed assertion does not leak the session.
        try:
            events = []
            session.on(events.append)

            await session.send_and_wait("Count from 1 to 5, separated by commas.")

            types = [e.type.value for e in events]

            # Should have streaming deltas, each carrying content
            delta_events = _events_of_type(events, _DELTA_EVENT)
            assert len(delta_events) >= 1
            _assert_deltas_have_content(delta_events)

            # Should still have a final assistant.message
            assert _MESSAGE_EVENT in types

            # The first delta should come before the last final message
            first_delta_idx = types.index(_DELTA_EVENT)
            last_assistant_idx = len(types) - 1 - types[::-1].index(_MESSAGE_EVENT)
            assert first_delta_idx < last_assistant_idx
        finally:
            await session.disconnect()

    async def test_should_not_produce_deltas_when_streaming_is_disabled(self, ctx: E2ETestContext):
        """streaming=False yields no deltas but still a final assistant.message."""
        session = await ctx.client.create_session(
            on_permission_request=PermissionHandler.approve_all, streaming=False
        )
        try:
            events = []
            session.on(events.append)

            await session.send_and_wait("Say 'hello world'.")

            # No deltas when streaming is off
            assert len(_events_of_type(events, _DELTA_EVENT)) == 0

            # But should still have a final assistant.message
            assert len(_events_of_type(events, _MESSAGE_EVENT)) >= 1
        finally:
            await session.disconnect()

    async def test_should_produce_deltas_after_session_resume(self, ctx: E2ETestContext):
        """A session created without streaming emits deltas when resumed with streaming=True."""
        session = await ctx.client.create_session(
            on_permission_request=PermissionHandler.approve_all, streaming=False
        )
        # Capture the id while the session is still connected.
        session_id = session.session_id
        try:
            await session.send_and_wait("What is 3 + 6?")
        finally:
            await session.disconnect()

        # Resume using a new client
        new_client = _new_client(ctx)
        try:
            session2 = await new_client.resume_session(
                session_id,
                on_permission_request=PermissionHandler.approve_all,
                streaming=True,
            )
            events = []
            session2.on(events.append)

            answer = await session2.send_and_wait("Now if you double that, what do you get?")
            assert answer is not None
            assert "18" in answer.data.content

            # Should have streaming deltas, each carrying content
            delta_events = _events_of_type(events, _DELTA_EVENT)
            assert len(delta_events) >= 1
            _assert_deltas_have_content(delta_events)

            await session2.disconnect()
        finally:
            # Always stop the extra client, even when an assertion fails.
            await new_client.force_stop()

    async def test_should_not_produce_deltas_after_session_resume_with_streaming_disabled(
        self, ctx: E2ETestContext
    ):
        """Resume with streaming=False — no delta events, but final message arrives."""
        # Create and complete a turn with streaming enabled
        session = await ctx.client.create_session(
            on_permission_request=PermissionHandler.approve_all, streaming=True
        )
        session_id = session.session_id
        try:
            await session.send_and_wait("What is 3 + 6?")
        finally:
            await session.disconnect()

        # Resume with streaming disabled
        new_client = _new_client(ctx)
        try:
            session2 = await new_client.resume_session(
                session_id,
                on_permission_request=PermissionHandler.approve_all,
                streaming=False,
            )
            events = []
            session2.on(events.append)

            answer = await session2.send_and_wait("Now if you double that, what do you get?")
            assert answer is not None

            delta_events = _events_of_type(events, _DELTA_EVENT)
            assert len(delta_events) == 0, "No deltas expected when streaming=False"

            assistant_events = _events_of_type(events, _MESSAGE_EVENT)
            assert len(assistant_events) >= 1, "Final assistant.message must still arrive"

            await session2.disconnect()
        finally:
            # Always stop the extra client, even when an assertion fails.
            await new_client.force_stop()

    async def test_should_emit_streaming_deltas_with_reasoning_effort_configured(
        self, ctx: E2ETestContext
    ):
        """Streaming + reasoning_effort produces delta events and session.start shows effort."""
        from copilot.generated.session_events import SessionStartData

        session = await ctx.client.create_session(
            on_permission_request=PermissionHandler.approve_all,
            streaming=True,
            reasoning_effort="high",
        )
        events = []
        session.on(events.append)

        try:
            await session.send_and_wait("What is 15 * 17?", timeout=60.0)

            delta_events = _events_of_type(events, _DELTA_EVENT)
            assert len(delta_events) >= 1, "Expected delta events with streaming=True"

            assistant_events = _events_of_type(events, _MESSAGE_EVENT)
            assert len(assistant_events) >= 1, "Expected final assistant.message"

            # Check session.start event (from get_events) has reasoning_effort
            all_msgs = await session.get_events()
            start_event = next((e for e in all_msgs if isinstance(e.data, SessionStartData)), None)
            assert start_event is not None, "Expected session.start event"
            assert start_event.data.reasoning_effort == "high"
        finally:
            await session.disconnect()