@@ -671,9 +671,15 @@ def test_live_run_serverless(self):
671
671
assert isinstance (response ["replies" ], list )
672
672
assert len (response ["replies" ]) > 0
673
673
assert [isinstance (reply , ChatMessage ) for reply in response ["replies" ]]
674
- assert "usage" in response ["replies" ][0 ].meta
675
- assert "prompt_tokens" in response ["replies" ][0 ].meta ["usage" ]
676
- assert "completion_tokens" in response ["replies" ][0 ].meta ["usage" ]
674
+ assert response ["replies" ][0 ].text is not None
675
+ meta = response ["replies" ][0 ].meta
676
+ assert "usage" in meta
677
+ assert "prompt_tokens" in meta ["usage" ]
678
+ assert meta ["usage" ]["prompt_tokens" ] > 0
679
+ assert "completion_tokens" in meta ["usage" ]
680
+ assert meta ["usage" ]["completion_tokens" ] > 0
681
+ assert meta ["model" ] == "microsoft/Phi-3.5-mini-instruct"
682
+ assert meta ["finish_reason" ] is not None
677
683
678
684
@pytest .mark .integration
679
685
@pytest .mark .slow
@@ -701,13 +707,18 @@ def test_live_run_serverless_streaming(self):
701
707
assert isinstance (response ["replies" ], list )
702
708
assert len (response ["replies" ]) > 0
703
709
assert [isinstance (reply , ChatMessage ) for reply in response ["replies" ]]
710
+ assert response ["replies" ][0 ].text is not None
704
711
705
712
response_meta = response ["replies" ][0 ].meta
706
713
assert "completion_start_time" in response_meta
707
714
assert datetime .fromisoformat (response_meta ["completion_start_time" ]) <= datetime .now ()
708
715
assert "usage" in response_meta
709
716
assert "prompt_tokens" in response_meta ["usage" ]
717
+ assert response_meta ["usage" ]["prompt_tokens" ] == 0
710
718
assert "completion_tokens" in response_meta ["usage" ]
719
+ assert response_meta ["usage" ]["completion_tokens" ] == 0
720
+ assert response_meta ["model" ] == "microsoft/Phi-3.5-mini-instruct"
721
+ assert response_meta ["finish_reason" ] is not None
711
722
712
723
@pytest .mark .integration
713
724
@pytest .mark .slow
@@ -926,9 +937,16 @@ async def test_live_run_async_serverless(self):
926
937
assert isinstance (response ["replies" ], list )
927
938
assert len (response ["replies" ]) > 0
928
939
assert [isinstance (reply , ChatMessage ) for reply in response ["replies" ]]
929
- assert "usage" in response ["replies" ][0 ].meta
930
- assert "prompt_tokens" in response ["replies" ][0 ].meta ["usage" ]
931
- assert "completion_tokens" in response ["replies" ][0 ].meta ["usage" ]
940
+ assert response ["replies" ][0 ].text is not None
941
+
942
+ meta = response ["replies" ][0 ].meta
943
+ assert "usage" in meta
944
+ assert "prompt_tokens" in meta ["usage" ]
945
+ assert meta ["usage" ]["prompt_tokens" ] > 0
946
+ assert "completion_tokens" in meta ["usage" ]
947
+ assert meta ["usage" ]["completion_tokens" ] > 0
948
+ assert meta ["model" ] == "microsoft/Phi-3.5-mini-instruct"
949
+ assert meta ["finish_reason" ] is not None
932
950
finally :
933
951
await generator ._async_client .close ()
934
952
0 commit comments