How We Improved Speaker Name Mapping Using Advanced Language Models
When working with earnings call audio files, tools like WhisperX are invaluable for generating transcriptions. However, out of the box, WhisperX assigns generic speaker labels such as spk01
, spk02
, and so on. Our goal was to replace these placeholders with the actual names and titles of each speaker to make the transcripts more informative and user-friendly.
Our Initial Approach: Utilizing spaCy for Named Entity Recognition
We first attempted to leverage spaCy
, a powerful natural language processing library, to identify names within the transcribed text. The idea was to parse the text for person entities and map them to the corresponding speaker labels. While this method showed some initial promise, it ultimately fell short due to the nuances and inconsistencies in how speakers are introduced during earnings calls.
For instance, our approach assumed that each speaker would be introduced before they began speaking—a reasonable assumption but not always accurate. Sometimes, introductions included only a first name or were intermixed with other names, leading to confusion. These exceptions undermined the reliability of our deterministic code.
Here’s a simplified version of the code we implemented:
Pythondef create_text_with_speaker_labels(data: dict) -> str:
speaker_groups = data["speaker_groups"]
result = ""
for speaker_group in speaker_groups:
speaker_label = speaker_group["speaker"]
speaker_text = " ".join(speaker_group["words"])
result += f"{speaker_label}:\n{speaker_text}\n"
return result
def create_speaker_name_mapping(data: dict,
use_optimized_find_people: bool = True) -> dict:
create_speaker_map_start_time = time.time()
speaker_groups = data["speaker_groups"]
log.info(f"create_speaker_name_mapping for {len(speaker_groups)} speaker groups..")
# Find People is compute bound work: https://stackoverflow.com/a/71367751
# Therefore it doesn't help to use threads here, must use separate processes.
with Pool(PROCESSES_WORKER_COUNT) as pool:
if use_optimized_find_people:
find_people_impl = find_people_optimized
else:
find_people_impl = find_people
peoples = pool.map(find_people_impl, map(lambda _group: " ".join(_group["words"]), speaker_groups))
speaker_map = {}
for i, (people, group) in enumerate(zip(peoples, speaker_groups)):
speaker_key = group["speaker"]
if i == 0:
speaker_map[speaker_key] = "Operator" # Assume the first speaker is the operator
if i + 1 >= len(speaker_groups):
continue
next_speaker_key = speaker_groups[i+1]["speaker"]
if next_speaker_key in speaker_map:
continue # Don't assign the speaker more than once
if len(people) == 0:
continue # No people found in this section of text
speaker_map[next_speaker_key] = people[0] # For now, just pick the first person found.
create_speaker_map_elapsed_seconds = time.time() - create_speaker_map_start_time
log.info(f"Speaker name mapping completed in {verbose_timedelta(create_speaker_map_elapsed_seconds)}.")
return speaker_map
def find_people_in_sentences(text: str) -> List[dict]:
"""
Give a string of text, find the sentences contained therein that contain people's names.
text (str): A string of text. Usually should be a paragraph (one speaker talking).
RETURNS: A list of sentences and people. The sentence is a list of Tokens
Example Result:
[
{
'people': ['Melissa Napier'],
'sentence': [Token, Token, Token...],
'text': 'Before I hand the call over to Melissa Napier, I want to reiterate our confidence in the path ahead.'
}
]
"""
import spacy
log.debug(f"find_people() on text of length: {len(text)}")
log.debug("Loading spacy en_core_web_sm ..")
load_start = time.time()
nlp = spacy.load("en_core_web_sm")
log.debug(f"Finished loading spacy en_core_web_sm in {time.time() - load_start} seconds.")
doc = nlp(text)
# tokens = [(w.text, w.pos_, w.ent_type_) for w in doc]
sentences = []
sentence = []
for token in doc:
sentence.append(token)
# print(token)
if token.text == ".":
sentences.append(sentence)
sentence = []
result = []
for sentence in sentences:
people = []
# sentence_text = " ".join([x.text for x in sentence])
# print(sentence_text)
# spacy.tokens.token
sentence_text = None
for i, token in enumerate(sentence):
# print(token.text, token.lemma_, token.pos_, token.tag_, token.dep_,
# token.shape_, token.is_alpha, token.is_stop)
# if "Sean" in token.text:
# print(token)
# if "Nakesh" in token.text:
# print(token)
if i == 0:
sentence_text = token.sent.text
if token.ent_type_ == "PERSON":
if i > 0 and sentence[i-1].ent_type_ == "PERSON":
people[-1] += f" {token.text}" # This is the same person, probably the person's last name.
else:
people.append(token.text)
log.debug(f"Person: {token.text}")
result.append({"text": sentence_text, "sentence": sentence, "people": people})
return result
def find_people(text: str) -> List[str]:
people_and_sentences = find_people_in_sentences(text)
people = [people_and_sentence["people"] for people_and_sentence in people_and_sentences]
return [item for row in people for item in row]
def has_introduction(sentence: str) -> bool:
lower_case_sentence = sentence.lower()
introductions = [
"introduce",
"pass the call over",
"hand the call over",
"hand it off",
"our next question",
]
for introduction in introductions:
if introduction in lower_case_sentence:
return True
return False
def score_sentence(sentence_index: int, sentence: str) -> int:
if has_introduction(sentence):
return 1000 + sentence_index
return sentence_index
def find_people_optimized(text: str) -> List[str]:
"""
Find people in a given text.
Args:
text (str): The text to find people in.
Returns:
List[str]: A list of people found in the text.
"""
people_and_scores = []
for i, sent in enumerate(find_people_in_sentences(text)):
people = sent["people"]
text = sent["text"]
if len(people) == 0: # Ignore sentences with no people found.
continue
people_and_scores.append({"people": people, "text": text, "score": score_sentence(i, text)})
# Sort in reverse (descending order) such that the highest scored people list is on top.
sorted_people = sorted(people_and_scores, key=lambda _x: _x["score"], reverse=True)
for x in sorted_people:
log.info(f"{x['score']} : {x['people']} - {x['text']}")
# print(f"{x['score']} : {x['people']} - {x['text']}")
return [people for peoples in sorted_people for people in peoples["people"]]
Despite our best efforts and the robustness of the code, the approach was too brittle. The myriad ways in which speakers introduce themselves—or are introduced—proved too variable for a deterministic method to handle effectively.
Turning to Advanced Language Models
Recognizing the limitations of our initial strategy, we decided to explore the capabilities of advanced language models. With recent developments in natural language processing, models like OpenAI’s GPT series have demonstrated remarkable proficiency in understanding and generating human-like text.
By crafting a carefully designed prompt, we aimed to leverage these models’ complex reasoning abilities to map speaker labels to actual names accurately. The language model could comprehend context, handle variations in introductions, and account for inconsistencies that our code could not.
Here's an example prompt we fed to Chat GPT:
Plain text<INSTRUCTIONS> Given the following transcript, please map the speaker labels to the actual names of the speakers: <TRANSCRIPT> spk07: Welcome to the year 2023 fourth quarter earnings conference call. At this time, all participants are in a listen-only mode. A question and answer session will follow the formal presentation. If anyone should require operator assistance during the conference, please press star zero on your telephone keypad. As a reminder, this conference is being recorded. I would now like to turn the conference over to your host, Brett Iverson, Vice President of Investor Relations. Mr. Iverson, please go ahead. spk10: Good afternoon, and thank you for joining us today. On the call with me are Satya Nadella, Chairman and Chief Executive Officer, Amy Hood, Chief Financial Officer, Alice Jolla, Chief Accounting Officer, and Keith Dolliver, Deputy General Counsel. On the Microsoft Investor Relations website, you can find our earnings press release and financial summary slide deck, which is intended to supplement our prepared remarks during today's call, and provides the reconciliation of differences between GAAP and non-GAAP financial measures. More detailed outlook slides will be available on the Microsoft Investor Relations website when we provide outlook commentary on today's call. On this call, we will discuss certain non-GAAP items. The non-GAAP financial measures provided should not be considered as a substitute for or superior to the measures of financial performance prepared in accordance with GAAP. They are included as additional clarifying items to aid investors in further understanding the company's fourth quarter performance in addition to the impact these items and events have on the financial results. All growth comparisons we make on the call today relate to the corresponding period of last year, unless otherwise noted. We will also provide growth rates in constant currency when available as a framework for assessing how our underlying businesses performed, excluding the effect of foreign currency rate fluctuations. where growth rates are the same in constant currency, we'll refer to the growth rate only. We'll post our prepared remarks to our website immediately following the call until the complete transcript is available. Today's call is being webcast live and recorded. If you ask a question, it will be included in our live transmission, in the transcript, and in any future use of the recording. You can replay the call and view the transcript on the Microsoft Investor Relations website. During this call, we will be making forward-looking statements, which are predictions, projections, or other statements about future events. These statements are based on current expectations and assumptions that are subject to risks and uncertainties. Actual results could materially differ because of factors discussed in today's earnings press release, in the comments made during this conference call, and in the risk factor section of our Form 10-K, Forms 10-Q, and other reports and filings with the Securities and Exchange Commission. We do not undertake any duty to update any forward-looking statement. And with that, I'll turn the call over to Satya. spk06: Thank you very much, Brett. We had a solid close to our fiscal year. The Microsoft Cloud surpassed $110 billion in annual revenue, up 27% in constant currency, with Azure all up accounting for more than 50% of the total for the first time. Every customer I speak with is asking not only how, but how fast they can apply next generation AI to address the biggest opportunities and challenges they face, and to do so safely and responsibly. To that end, we remain focused on three key priorities. First, helping customers use the breadth and depth of Microsoft Cloud to get the most value out of their spend. Second, investing to lead in the new AI platform shift by infusing AI across every layer of the tech stack. And third, driving operating leverage. Now I'll highlight examples of our progress, starting with infrastructure. Azure continues to take share as customers migrate their existing workloads and invest in new ones. We continue to see more cloud migrations as it remains early when it comes to long-term cloud opportunity. We're also seeing increasing momentum with Azure Arc, which now has 18,000 customers up 150% year-over-year, including Carnival Corp, Domino's, Thermo Fisher. And Azure AI is ushering in new, born-in-the-cloud AI-first workloads with the best selection of frontier and open models, including Meta's recent announcement supporting Lama on Azure and Windows, as well as OpenAI. We have great momentum across Azure OpenAI service. More than 11,000 organizations across industries, including IKEA, Volvo Group, Zurich Insurance, as well as digital natives like Flipkart, Humane, Kahoot, Miro, Typeface use the service. That's nearly 100 new customers added every day this quarter. Mercedes-Benz, for example, is bringing ChatGPT via Azure OpenAI to more than 900,000 vehicles in the United States, making its in-car voice assistant more intuitive. And Moody's built its own internal co-pilot to improve productivity of its 14,000 employees. We're also partnering broadly to scale this next generation of AI to more customers. Snowflake, for example, will increase its Azure spend as it builds new integrations with Azure OpenAI, and KPMG has announced a multi-billion dollar commitment to our cloud and AI services to transform professional services. Now on to data. Every AI app starts with data, and having a comprehensive data and analytics platform is more important than ever. Our intelligent data platform brings together operational databases, analytics, and governance so organizations can spend more time creating value and less time integrating their data estate. We introduced Microsoft Fabric this quarter, which unifies compute, storage, and governance with a disruptive business model. One month in, we are encouraged by early interest and usage. Over 8,000 customers have signed up to trial the service and are actively using it, and over 50% are using four or more workloads. All up, we once again took share with our analytic solutions with customers like Bridgestone, Chevron, and Equinor turning to our stack. Now on to developers. New Azure AI Studio is becoming the tool of choice for AI development in this new era, helping organizations ground, fine-tune, evaluate, and deploy models and do so responsibly. VS Code and GitHub Copilot are category-leading products when it comes to how developers code every day, Nearly 90% of GitHub co-pilot sign-ups are self-service, indicating strong organic interest and pull-through. More than 27,000 organizations, up 2x quarter over quarter, have chosen GitHub Co-Pilot for Business to increase the productivity of their developers, including Airbnb, Dell, and Scandinavian Airlines. We're also applying AI across low-code, no-code toolchain to help domain experts automate workflows, create apps and web pages, build virtual agents, or analyze data using just natural language. Co-pilot in Power BI combines the power of large language models with an organization's data to generate insights faster, and co-pilot in Power Pages makes it easier to create secure low-code business websites. One of our tools that's really taken off is Copilot and Power Virtual Agents, which is delivering one of the biggest benefits of this new era of AI, helping customer service agents be significantly more productive. HP and Virgin Money, for example, have both built custom chatbots with Copilot and Power Virtual Agents that were trained to answer complex customer inquiries. All up, more than 63,000 organizations have used AI-powered capabilities in Power Platform, up 75% quarter over quarter. Finally, Power Automate now has 10 million monthly active users at companies like Jaguar, Land Rover, Repsol, Rolls-Royce, up 55% year over year. And we're going further with new process mining capabilities in Power Automate, which are helping organizations optimize business processes and in turn build their AI advantage. Now on to business applications. We are taking share in every category as we help organizations across the private and public sector from Avis to Albertsons to Breville to Equinox and the U.S. Department of Veterans Affairs transform their mission-critical business processes. All Up Dynamics surpassed $5 billion in revenue over the past fiscal year, with our customer experience, service, and finance and supply chain businesses all surpassing $1 billion in annual sales. This quarter, we brought Dynamics 365 Co-Pilot to our ERP portfolio, including finance, project operations, and supply management. And with our new Microsoft Sales Co-Pilot, sellers can ground their customer interactions with data from CRM systems, including both Salesforce and Dynamics, to personalize customer interactions and close more deals. Now on to our industry and cross-industry clouds. Our Microsoft Cloud for Sustainability is helping customers like Costco, Ladder Lakes, and REI take action to meet their environmental goals. And in healthcare, hundreds of organizations are using our Nuance DAX ambient intelligence solution to automatically document patient encounters at the point of care. This quarter, we expanded our collaboration with Epic to integrate Nuance DAX Express directly into their industry-leading EHR system. Now on to future work. Across industries, customers like Ahold Delhaize, Deutsche Bank, Novartis, Siemens, Wells Fargo are choosing Microsoft 365 Premium offerings for differentiated security, compliance, voice, and analytics value. And four months ago, we introduced a new pillar of customer value with Microsoft 365 Copilot. We are now rolling out Microsoft 365 Copilot to 600 paid customers through our early access program. And feedback from organizations like Emirates, NBD, General Motors, Goodyear, and Lumen is that it's a game changer for employee productivity. We continue to build momentum in Microsoft Teams across collaboration, chat, meetings, and calling. We now have more than 1,900 apps in Teams App Store and companies in every industry from British Airways to Dentsu to Eli Lilly and Manulife have built over 145,000 custom line of business apps, bringing business process directly into the flow of work. Five months in, Teams Premium has already surpassed 600,000 seats as companies like BNY Mellon, Clifford Chance, PepsiCo, and Starbucks chose the add-on for advanced features like end-to-end encryption and real-time translation. Teams Phone is the market leader in cloud calling with more than 17 million PSTN users, up 45% year-over-year. Teams Room is used by more than 70% of the Fortune 500, including L'Oreal, United Airlines, and U.S. Bank, and revenue more than doubled year-over-year this quarter. And with Microsoft Viva, we are creating a new market category for employee experience. Viva now has 35 million monthly active users as companies like CBRE, Fujitsu, and Unisys turn to the platform to build data-driven, high-performance organizations. Now on to Windows. The number of devices running Windows 11 has more than doubled in the last year, and we are seeing continued growth in Windows 11 commercial deployments worldwide by companies like AT&T, Kronos, and Westpac. We are also transforming how Windows is experienced and managed for enterprise customers with Azure Virtual Desktop and Windows 365, which together surpassed $1 billion in revenue for the first time over the past 12 months. Enbridge, Eurowings, Marriott International, and TD Bank Group, for example, all chose cloud-delivered Windows this quarter. Windows 11 is also rapidly becoming a powerful new canvas in this new era of AI. We introduced Windows Co-Pilot this quarter, helping every Windows 11 user become a power user with just natural language and are excited to put it in the hands of more people in the coming months. Now on to security. More than 1 million organizations now count on our comprehensive AI-powered solutions to protect their digital estate across clouds and endpoint platforms, up 26% year-over-year. More than 60%, including leading enterprises like ABN Amro, Dow, and Heineken, use four or more of our security products, up 33% year-over-year, underscoring our end-to-end differentiation. And we once again took share across all major categories we serve as we innovate to protect customers. In identity, Microsoft Entra ID has more than 610 million monthly active users, and we are adding SSE to our Entra product family to complement our leading identity solution and secure access to any app or resource from anywhere. Finally, our security co-pilot, the first product to apply this next generation of AI to SecOps, will be available to customers via a paid early access program this fall. Now on to LinkedIn. LinkedIn's revenue surpassed $15 billion for the first time this fiscal year, and membership growth has now accelerated for eight quarters in a row, a testament to how mission critical the platform has become to help more than 950 million members connect, learn, sell, and get hired. Our talent solutions business surpassed $7 billion in revenue for the first time over the past 12 months, and our hiring business took share for the fourth consecutive quarter. We continue to use AI to help our members and customers connect to opportunities and tap into experiences of experts on the platform. Our AI-powered collaborative articles are now the fastest growing traffic driver in LinkedIn. And finally, we are helping LinkedIn stay trusted and authentic. More than 7 million members have verified who they are or where they work, many using new integrations with Microsoft Entra as well as Clear and HyperVerge. Now on to search, advertising, and news. While it's early in our journey, we are reshaping daily search and web habits with our co-pilot for the web. This quarter, we introduced new AI-powered features, including multimodal capabilities with Visual Search and Bing Chat. We're expanding to businesses with Bing Chat Enterprise, which offers commercial data protection, providing an easy on-ramp for any organization looking to get the benefit of this next generation of AI today. Bing is also the default search experience for OpenAI's ChatGPT, bringing timely answers with links to our reputable sources to ChatGPT users. To date, Bing users have engaged in more than 1 billion chats and created more than 750 million images with Bing Image Creator, and Microsoft Edge took share for the ninth consecutive quarter. More broadly, we are growing our ad network, which is now available in 187 markets spanning search, display, native, retail media, video, and connected TV. Now on to gaming. Last week, we extended our Activision Blizzard merger agreement deadline to October. We continue to work through the regulatory approval process and remain confident about getting the deal done. We are committed to bringing more games to more players everywhere. Great content is key to our approach, and our pipeline has never been stronger. We announced our most ambitious lineup of games ever at our showcase last month, including 21 titles that will be available via Xbox Game Pass. And we're looking forward to the release of Starfield this fall, Bethesda's first new universe in 25 years. All up, we set new fourth-quarter highs for monthly active users driven by strength of console as well as monthly active devices. And we saw record fourth-quarter engagement across Game Pass with hours played up 22% year-over-year. And just last week, we announced Game Pass Core, bringing together online play from Xbox Live and content from Game Pass into a single offering. In closing, I'm energized about the opportunities ahead. We continue to innovate across the tech stack to help our customers thrive in the new era of AI. And with that, let me turn it over to Amy. spk04: Thank you, Satya. And good afternoon, everyone. This quarter, revenue was $56.2 billion, up 8% and 10% in constant currency. Earnings per share was $2.69 and increased 21% and 23% in constant currency. In our largest quarter of the year, results exceeded expectations with focused execution by our sales and partner teams. These execution efforts led to share gains again this quarter in Azure, Dynamics, Security, and Edge. In our commercial business, we continued to see healthy renewal strength, which includes our upsell and attach motions, particularly with Microsoft 365 E5. Growth of new business continued to be moderated for products sold outside the Microsoft 365 suite, including standalone Office 365, EMS, and Windows commercial products. As expected in Azure, we saw a continuation of the optimization and new workload trends from the prior quarter. In our consumer business, the PC market overall was in line with expectations, although the early timing of back-to-school inventory bills benefited Windows OEM. Advertising spend was slightly lower than anticipated, which impacted search and news advertising and LinkedIn marketing solutions. Commercial bookings decreased 2% and 1% in constant currency, in line with expectations, against a prior year comparable that was our largest commercial bookings quarter ever. In addition to the healthy execution across our renewal sales motions mentioned earlier, we saw a record number of $10 million plus contracts for both Azure and Microsoft 365. And the average annualized value for our large long-term Azure contracts was the highest it's ever been, driven by customer demand for our innovative cloud solutions today, as well as interest in AI opportunities ahead. Commercial remaining performance obligation increased 19% and 18% in constant currency to $224 billion. Roughly 45% will be recognized in revenue in the next 12 months, up 13% year-over-year. The remaining portion, which will be recognized beyond the next 12 months, increased 22%. And this quarter, our annuity mix increased to 97%. FX impact on total company revenue, segment level revenue, and operating expense growth was as expected. FX decreased COGS growth by one point, one point favorable to expectations. Microsoft Cloud revenue was $30.3 billion and grew 21% and 23% in constant currency, slightly ahead of expectations. Microsoft Cloud gross margin percentage increased roughly three points year-over-year to 72%, also slightly ahead of expectations. Excluding the impact of the change in accounting estimate for useful lives, Microsoft Cloud gross margin percentage increased slightly, driven by improvements in Office 365, partially offset by lower Azure margin, and the impact of scaling our AI infrastructure to meet growing demand. Company gross margin dollars increased 11% and 13% in constant currency, including two points due to the change in accounting estimate. Gross margin percentage increased year-over-year to 70%. Excluding the impact of the change in accounting estimate, gross margin percentage increased slightly, driven by improvements in Office 365. Operating expense increased 2% in line with expectations as savings across the company from our focus on prioritization and efficiency were offset by the charge related to the Irish Data Protection Commission matter. At a total company level, headcount at the end of June was flat compared to a year ago. Operating income increased 18% and 21% in constant currency, including four points due to the change in accounting estimate. operating margins increased roughly four points year-over-year to 43%. Excluding the impact of the change in accounting estimates, operating margins increased roughly two points, driven by improved operating leverage through disciplined cost management. Now, to our segment results. Revenue from productivity and business processes was $18.3 billion and grew 10% and 12% in constant currency, ahead of expectations, with better than expected results in office commercial, partially offset by LinkedIn. Office commercial revenue grew 12% and 14% in constant currency. Office 365 commercial revenue increased 15% and 17% in constant currency, a bit better than expected with particular strength in E5 upsell renewal noted earlier. Paid Office 365 commercial seats grew 11% year over year with installed base expansion across all workloads and customer segments. Seat growth was again driven by our small and medium business and frontline worker offerings. Office commercial licensing declined 20% and 18% in constant currency, with better than expected transactional purchasing. Office consumer revenue increased 3% and 6% in constant currency, with continued momentum in Microsoft 365 subscriptions, which grew 12% to 67 million. LinkedIn revenue increased 5% and 7% in constant currency, driven by growth in talent solutions, with some continued bookings impact from the weaker hiring environment and key verticals. Growth was partially offset by a decline in marketing solutions due to the lower ad spend noted earlier. Dynamics revenue grew 19% and 21% in constant currency, driven by Dynamics 365, which grew 26% and 28% in constant currency, with continued healthy growth across all workloads. Segment gross margin dollars increased 14% and 16% in constant currency, and gross margin percentage increased roughly three points year over year. Excluding the impact of the change in accounting estimate, gross margin percentage increased roughly one point, driven by improvements in Office 365. Operating expenses decreased slightly, and operating income increased 25% and 29% in constant currency, including three points due to the change in accounting estimate. Next, the Intelligent Cloud segment. Revenue was $24 billion, increasing 15% and 17% in constant currency, slightly ahead of expectations. Overall, server products and cloud services revenue increased 17% and 18% in constant currency. Azure and other cloud services revenue grew 26% and 27% in constant currency, including roughly one point from AI services, as expected. In our per-user business, the enterprise mobility and security install base grew 11% to over 256 million seats with impact from the continued growth trends in new business noted earlier. In our on-premises server business, revenue decreased 1% and was relatively unchanged in constant currency, driven by a slight decrease in new annuity contracts, which carry higher in-period revenue recognition. Enterprise services revenue grew 4% and 5% in constant currency, with better than expected performance across enterprise support services and industry solutions. Segment gross margin dollars increased 16% and 17% in constant currency, and gross margin percentage increased slightly. Excluding the impact of the change in accounting estimates, gross margin percentage declined roughly two points, driven by sales mixed shift to Azure and the lower Azure margin noted earlier. Operating expenses increased 10%, Operating income grew 20% and 22% in constant currency, with roughly six points from the change in accounting estimate. Now to more personal computing. Revenue was $13.9 billion, decreasing 4% and 3% in constant currency above expectations, driven by better than expected performance in Windows, partially offset by gaming. Windows OEM revenue decreased 12% year-over-year ahead of expectations due to seven points of benefit from early back-to-school inventory builds, while the overall PC market was as expected. Devices revenue decreased 20% and 18% in constant currency, roughly in line with expectations. Windows commercial products and cloud services revenue increased 2% and 3% in constant currency ahead of expectations due to the renewal strength noted earlier even with the moderated growth of new business and standalone offerings. Search and news advertising revenue XTAC increased 8%, a bit behind expectations due to the lower ad spend noted earlier. Higher search volumes, share gains again this quarter for our Edge browser, and the benefit from the Zander acquisition were partially offset by the impact from third-party partnerships. And in gaming, revenue increased 1% and 2% in constant currency, lower than expected due to weakness in first-party and third-party content performance. Xbox content and services revenue increased 5% and 6% in constant currency, and Xbox hardware revenue declined 13%. Segment gross margin dollars declined 2% and were relatively unchanged in constant currency, and gross margin percentage increased roughly one point year over year, driven by sales makeshift to higher margin businesses. Operating expenses declined 9% and 8% in constant currency. Operating income increased 4% and 6% in constant currency. Now, back to total company results. Capital expenditures, including finance leases, were $10.7 billion to support cloud demand, including investments in AI infrastructure. Cash paid for PP&E was $8.9 billion. Cash flow from operations was $28.8 billion, up 17% year-over-year, as strong cloud billings and collections were partially offset by a tax payment related to the R&D capitalization provision. Free cash flow was $19.8 billion, up 12% year-over-year. Excluding the impact of this tax payment, cash flow from operations increased 22% and free cash flow increased 19%. This quarter, other income and expense was $473 million, higher than anticipated, driven by net gains on foreign currency remeasurement. Our effective tax rate was approximately 19%. And finally, we returned $9.7 billion to shareholders through share repurchases and dividends. bringing our total cash return to our shareholders to over $38 billion for the full fiscal year. Now, let's turn to next fiscal year and start with a few reminders. First, the change in accounting estimate for the useful life of server and network equipment resulted in $3.7 billion of depreciation expense shifting from FY23 to future periods. Our FY23 operating income and margins benefited from this change in accounting estimate, and that will be a headwind to growth in FY24 as the benefit reduces to $2.1 billion. Next, my outlook commentary for both the full year and next quarter is on a U.S. dollar basis and less specifically noted otherwise. And my outlook does not include any impact from the Activision acquisition, which we continue to work towards closing. subject to obtaining required regulatory approvals. Now for some thoughts on the full year of FY24. With the weaker U.S. dollar and assuming current rates remain stable, we expect FX to increase full-year revenue growth by approximately one point, with no impact to COGS or operating expense growth. The impact in H1 is expected to be greater than H2. At a total company level, revenue growth from our commercial business will continue to be driven by the Microsoft Cloud and will again outpace the growth from our consumer business. Even with strong demand and a leadership position, growth from our AI services will be gradual as Azure AI scales and our co-pilots reach general availability dates. So for FY24, the impact will be weighted towards H2. To support our Microsoft Cloud growth and demand for our AI platform, we will accelerate investment in our cloud infrastructure. We expect capital expenditures to increase sequentially each quarter through the year as we scale to meet demand signals. We are committed to driving operating leverage, and therefore we will manage our total cost growth across COGS and operating expense in line with the demand signals we see, as well as revenue growth. Increased capital spend will drive higher COGS growth than in FY23, and FY24 operating expense growth will remain low as we prioritize our spend. Therefore, we expect full-year operating margins to remain flat year-over-year, even with the headwind from the change in accounting estimates. And finally, we expect our FY24 tax rate to be around 19%. Now, to the outlook for the first quarter. First, FX. Based on current rates, we expect FX to increase total revenue and operating expense growth by approximately one point with no impact to COGS growth. Within the segments, we expect FX to increase revenue growth in Intelligent Cloud by one point with no impact to productivity and business processes or more personal computing. and commercial bookings. Strong execution across our core annuity sales motions, including our renewal and upsell motions, along with long-term measure commitments, should drive healthy growth on a growing expiry base. Microsoft Cloud gross margin percentage should decrease roughly one point year over year, driven by the accounting estimate change headwind noted earlier. Excluding that impact, Q1 Cloud gross margin percentage will be up roughly one point, primarily driven by improvements in Azure and Office 365, partially offset by sales makeshift to Azure and the impact of scaling our AI infrastructure to meet growing demand. We expect capital expenditures to increase sequentially on a dollar basis, as noted earlier, driven by investments in our AI infrastructure. Reminder, there can be normal quarterly spend variability in the timing of cloud infrastructure build-out. Next, the segment guidance. In productivity and business processes, we expect revenue to grow between 9 and 11% or 18 to 18.3 billion U.S. dollars. In Office Commercial, revenue growth will again be driven by Office 365 with seat growth across customer segments and ARPU growth through E5. We expect Office 365 revenue growth to be roughly 16% in constant currency. In our on-premises business, we expect revenue to decline in the low 20s. In Office Consumer, we expect revenue growth to be in the low to mid single digits, driven by Microsoft 365 subscriptions. For LinkedIn, we expect revenue growth in the low to mid single digits. Even with share gains in our hiring business, growth will continue to be impacted by the overall markets for recruiting and advertising, especially in the technology industry where we have significant exposure. And in Dynamics, We expect revenue growth in the mid to high teens driven by continued growth in Dynamics 365. For Intelligent Cloud, we expect revenue to grow between 15% and 16%, or 14% and 15% in constant currency. Revenue should be $23.3 to $23.6 billion. Revenue will continue to be driven by Azure, which, as a reminder, can have quarterly variability primarily from our per-user business and from in-period revenue recognition, depending on the mix of contracts. In Azure, we expect revenue growth to be 25 to 26% in constant currency, including roughly two points from all Azure AI services. Growth continues to be driven by our Azure consumption business, and we expect the trends from Q4 to continue into Q1. Our per user business should continue to benefit from Microsoft 365 Suite momentum, though we expect continued moderation in growth rates given the size of the install base. In our on-premises server business, we expect revenue to decline low to mid-single digits against a prior comparable that benefited from annuity purchasing ahead of the SQL Server 2022 launch. And in enterprise services, revenue should decline low to mid-single digits year-over-year as growth in enterprise support services will be more than offset by a decline in industry solutions. In more personal computing, We expect revenue of 12.5 to 12.9 billion U.S. dollars. Windows OEM revenue should decline low to mid-teens, including five points of negative impact from the earlier back-to-school inventory bills that were pulled into the fourth quarter. Our guide assumes no significant changes to the PC demand environment. In devices, revenue should decline in the mid-30s due to the overall PC market and adjustments we made in our portfolio with an increased focus on our higher margin premium products. In Windows commercial products and cloud services, customer demand for Microsoft 365 and our advanced security solutions should drive revenue growth in the mid to high single digits. Search and news advertising ex-tech revenue growth should be mid to high single digits, roughly five points higher than overall search and news advertising revenue, driven by continued volume strength supported by edge browser share gains. Growth will continue to be impacted by the advertising spend environment and third-party partnerships mentioned earlier. We continue to be excited by Bing usage signals and the longer-term opportunity as we invest in AI. And in gaming, we expect revenue growth in the mid-single digits, We expect Xbox content and services revenue growth in the mid to high single digits, driven by first-party and third-party content, as well as Xbox Game Pass. Now back to company guidance. We expect COGS between $16.6 to $16.8 billion U.S. dollars and operating expense of $13.5 to $13.6 billion U.S. dollars. Together, total cost growth should be around 6%. Other income and expense should be roughly $300 million as interest income is expected to more than offset interest expense. Two reminders. This does not include any impact from Activision on interest income and expense, and we are required to recognize mark-to-market gains or losses on our equity portfolio, which can increase quarterly volatility. We expect our Q1 effective tax rate to be around 19%. And finally, As a reminder for Q1 cash flow, we expect to make a $2.7 billion cash tax payment related to the TCJA transition tax. We do not expect a payment related to the R&D capitalization provision in Q1. In closing, as a company, we delivered on the FY23 financial commitments we discussed a year ago on revenue and operating margin. A focus on operational excellence allowed us to achieve these targets while we delivered near-term value to customers and prioritized our investments to continue to lead in the future. As we start FY24, we are excited for the opportunities ahead and remain focused on delivering the three key priorities Sakya mentioned. We'll maintain our lead as the top commercial cloud by helping customers use the breadth and depth of the Microsoft cloud. We'll continue to invest in our cloud and AI infrastructure while scaling with growing demand so we can lead the AI platform wave. And finally, we'll align our costs with growth as we are committed to driving operating leverage. With that, let's go to Q&A, Brett. spk10: Thanks, Amy. We'll now move over to Q&A. Out of respect for others on the call, we request that participants please only ask one question. Joe, can you please repeat your instructions? spk07: Yes. Ladies and gentlemen, if you would like to ask a question, please press star 1 on your telephone keypad, and a confirmation tone will indicate your line is in the question queue. You may press star 2 if you would like to remove your question from the queue. For participants using speaker equipment, it may be necessary to pick up your handset before pressing the star keys. One moment, please, while we poll for questions. And our first question comes from the line of Keith Weiss with Morgan Stanley. Please proceed. spk01: Excellent. Thank you guys for taking the question and a very nice end to a great fiscal year. Satya, you started out your comments talking about how every customer conversation has the customer asking you about utilizing generative AI technology and how fast they could utilize that generative AI technology. What's the answer? What do you tell them in terms of the pace with which that could get into the marketplace and your customers can start using it And then for Amy, how should investors think about just the fundamental gross margins behind these generative AI technologies? We understand there's going to be a lot of CapEx to ramp up underneath these, but what should we expect in terms of what the ultimate gross margin looks like underneath all these new generative AI solutions? Thank you. spk06: Thank you, Keith, for the question. The fundamental guidance and conversation that we have with customers is twofold. One is the easiest path to value auto-generative AI is to adopt certain solutions. For example, GitHub Copilot. In some sense, it's sort of the no-brainer to add productivity leverage for all of the software developers in any organization, whether you're a bank, you're a retailer, or you're a software company. It applies to everyone. So that's probably, you know, one of the things that we have seen very good, you know, even productivity data and great adoption. And then obviously the excitement that there is already around the M365 co-pilot. So first thing we sort of talk about is how we ourselves are deploying all these co-pilots across, whether it's sales co-pilot or M365 co-pilot or GitHub co-pilot, how do you get maximum value out of these horizontal tool chain. And then on top of that, we have taken what we did underneath these products and built it out as a first-class tech stack, which we talked at our developer conference called the Co-Pilot Stack. And then with Azure AI tooling, made it possible for someone like Moody's to build their own co-pilot for their people. you know so to us we want to be able to help customers build their generative AI applications on top of Azure AI and with speed if you will and so those are the two things that we you know we ask them to identify where they can get the maximum productivity leverage and then we even swarm with our own resources to help them you know get those things done and the last comment I'd make is The cloud and data in the cloud enables all this because I think the diffusion cycle here is, in some sense, we have a new set of cloud meters that are getting adopted faster because of everything else that came before it in the cloud. So those would be the observations. spk04: And to your question, Keith, on gross margins and how I think about those going forward, the first thing I would say is that I expect gross margins here to transition over time just like they did in the prior cloud transition. I would also say I expect workloads and the gross margins of the workloads to be different, just like they are in the cloud today. I would also add one thing that's different than last time, we've talked a bit about this before, is that we start out in a different place with more of a shared platform, which allows us to scale those gross margins a bit faster than last time. And we do expect, as you asked and Satya talked about, the pace. of this adoption curve, we do expect to be faster. So you're seeing the CapEx spend accelerate in Q4 and then again in Q1 and we've talked about what it should look like the rest of the year. Now that being said, we're talking about all that and going through that transition while delivering in FY24 over FY23 effectively a point higher operating margins. Because if it's flat, year over year as we guided, with the headwind from the useful life change, when you correct for that, it's about a point higher. So I think the real focus here is being able to be aggressive in meeting the demand curve and focusing on the transition and growth in gross margins delivering the operating leverage. spk10: Excellent. Thank you, guys. Thanks, Keith. Operator, next question, please. spk07: Our next question comes from the line of Brent Till with Jefferies. Please proceed. spk11: Thank you. Satya, on the optimization headwinds that you continue to see, when do you think we hit peak optimization? Are we getting close to hitting that peak and getting some relief in the back half of the year and maybe AI helping provide as a tailwind? Any color from what you're seeing from your perspective would be helpful. spk06: Sure, Brent. Thank you for the question. Yeah, a couple of observations. One is I think overall in the cloud you do see new project starts, and then those project starts get optimized, and then you sort of time series all of that, and that's sort of what you see in the normal course. What happened here was during the pandemic, obviously, there were lots of new project starts, and optimization in some sense was postponed. And that's where you're seeing, I'll call it, catch-up optimization. And that's something that, to your point, we will lap going into the next couple of quarters. I think it will come down. And we are seeing new project starts, both traditional type of project starts, even cloud migrations. data applications, and of course, obviously, the AI applications. But we'll get back to, I'll call it, the normal pace of new project starts and optimizations going forward, but we will cycle through, I think, in the next couple of quarters, what is the last catch-up optimization. spk04: I would just, Everett, I think to Satya's point, and maybe to build a bit of a line for you, you know, I think it felt very similar to last quarter where we made the same comments, which is we're seeing sort of the normal optimization, plus we're seeing new workload starts across these workloads Satya talked about, and I think that's what we're saying going forward, and really what the change is just that lapping of, I think, a bit of the catch-up from a year ago, and you're right, we'll continue to do that through H2. spk10: Thanks. Thanks, Brent. Operator, next question, please. spk07: The next question comes from the line of Mark Mordler with Bernstein Research. Please proceed. spk08: Thank you very much for taking the question and congrats on the quarter. Amy, CACBUX moved up significantly, queue over queue and year over year, and it's increasing moving forward. Can you give us some color? Is it physical data centers? Is it predominantly servers? Is it predominantly AI-driven? How should we think about the useful life of it? And then, quickly for Satya, can you give us some status on the general availability of the full co-pilot development stack and how long it's taking clients and partners to build co-pilots? Thanks. spk04: Well, I start on the CapEx question, Satya, then I'll turn it over to you. Mark, really, first of all, both in Q4 and then talking about Q1, the acceleration is really quite broad. It's both on both the data centers and the physical basis, plus CPUs and GPUs and networking equipment, think of it in a broad sense as opposed to a narrow sense. So it's overall increases of acceleration of overall capacity. And I think if you look back over really FY23, you wouldn't have seen some of the pace on normal, what I would say capacity ads, even for the normal Azure workloads. So you're seeing both accelerations, the normal Azure workloads plus some of the AI workloads is partially the reason. So it's why I do comment quite often that it's both overall commercial cloud demand and building out capacity for AI, it's both. spk06: Yeah, and I think just for perspective, I think it's sort of always good to think about it where we have, what, 111 commercial cloud business growing. at, what, 22 percent year-over-year, and then you had a CapEx growth, which is, you know, around the same number, 23, 24 percent. So in some sense, it's sort of replacement capital plus some new capital that is going to drive new growth. So that's, I think, the scale. And we feel good about that structure of overall, you know, growth rates. and how it translates into future TAM opportunity for us. I went to your other question on how all this translates into project starts effectively. The Copilot stack is available today on Azure. So we have everything from Azure AI tool chain where you can use obviously Azure OpenAI or even you can use open models from Lama and other Hugging Face models. You have all the fabric and all of our operational data stores for what is one of the most useful patterns around generative AI is what is called retrieval augmented generation, which is you take the data that you have in the data stores, use it in a prompt to generate completions, summaries, what have you. And so that's something that we've seen a lot of and the co-pilot are fundamentally orchestrations of that. And so we have all of these services available. The thing that's fascinating is, When you use something like Power Virtual Agent, you have a low-code, no-code tool to build effectively these AI products or full-fledged co-pilots like we've built. And all of the underlying primitives for that are available on Azure. The tool chain is available on Azure. And the speed with which customers are able to deploy them, ISVs are able to build them, is pretty impressive. spk08: Thank you. I appreciate it. spk10: Thanks, Mark. Operator, next question, please. spk07: The next question comes from the line of Cash Rangan with Goldman Sachs. Please proceed. spk05: Hi. Thank you very much. Congratulations on the quarter. If I could, I just wanted to get your thoughts, shift the discussion away from COGS and CAPEX to more of the top line outlook. It looks like Azure growth rate is definitely starting to stabilize and generative AI contribution to Azure is measurably improving quarter by quarter. and optimization in a broader sense is also starting to settle down. Where does this leave with the company's outlook for Azure growth rate in the future quarters Are we at a point where we've bottomed out and we could start to see some acceleration due to the trends we discussed? And also, if you take the superset of Microsoft Cloud, when you throw in the new pricing for co-pilot, it certainly looks like the TAMs are opening up in a pretty significant way. So, when you take that broader lens, that 21%, 22% growth rate that Satya and Amy referred to, What is the, what could be the outlook? Could we be too optimistic in entertaining hopes of some kind of acceleration in the years ahead? Or how do you think about the outlook on the top line? Thank you so much. spk06: Sure, Akash. Thanks for the question. So, maybe I'll start, and then, Amy, you can add. Because I think, we do think about what's the long-term TAM here, right? I mean, this is, you heard me talk about this as a percentage of GDP, what's going to be tech spend. If you believe that let's say the 5% of GDP is gonna go to 10% of GDP, maybe that gets accelerated because of the AI wave, then the question is how much of that goes to the various parts of our commercial cloud and then how competitive are we in each layer, right? So if you sort of break it down, you talked about how Microsoft 365, we think of this co-pilot as a third pillar, right? We had the creation tools, We then add all the communication and collaboration services, and we think the AI co-pilot is a third pillar, so we're excited about it. Amy talked about how we want to get it out first as part of this preview, and then in the second half of the next fiscal year, we'll start getting some, you know, of the real revenue signal from it. So we're looking forward to it, but we think of it long-term as a third pillar, like we thought about, you know, something like, say, Teams or SharePoint back in the day or what have you. Then Azure, you know, the way I think about it is we still are whatever, inning two or inning three of even the cloud migration, especially if you view it, right, whether by industry moves to the cloud, segment move to the cloud, as well as country adoption of the cloud, right? So there's still, you know, early innings of the cloud migration itself, so there's a lot there still. And then on top of that, there is this complete new world of AI driving a set of new workloads. And so we think of that, again, being pretty expansive from a TAM opportunity, and we'll play it out. But at the same time, you know, as we are a $111 billion commercial cloud that has grown you know, in 20s. And so, therefore, we do hit a lot of large numbers. But that said, we do think that this is a business that can have sustained high growth, which is something that, you know, we're excited about. spk04: And I think the only thing, Cash, I would add is, you know, I think in some ways what we're really pointing to is there's a process here. We see the demand signal is quite strong. It remains strong. I'm thrilled with all the product announcements we've made. I'm thrilled with them moving to Preview and then moving to GA. They absolutely are expansive in terms of addressable market. They reach new budget pools is almost the way I talk about it a lot in terms of how CIOs or CFOs that I talk to think about that investment. So a growing opportunity. And as you know, we're focused on executing against that. And then revenue is an outcome. But it certainly does require the demand signal requires the capital expense and then creates the opportunity. And that's why I think in some ways we're spending a little more time talking about some of that investment is because it is the demand signal. spk10: Awesome. Thank you so much. Thanks, Cash. Operator, next question, please. spk07: Our next question comes from the line of Carl Kierstead with UBS. Please proceed. spk03: Okay, great. Amy, if I could double-click a little bit on the exciting news around M365 co-pilot. As everybody on the line looks to layer that opportunity into our models, I just wanted to get your views. Are there any guardrails you'd offer us to sort of keep us in line? Is there a degree of gross margin pressure in the office segment? In other words, is it a fairly cost-intensive new product that we should keep in mind? And also, could it pull along in the sense that you need Azure AD and perhaps some of the other cybersecurity products. So a little color there might help everybody with their modeling exercise tonight and in the coming weeks. spk04: Thanks, Carl. You know, I think maybe I'll first start with the process we have when we release new products. I absolutely understand we are excited too by the demand signal, the customer reaction, really the request we're getting to be in the paid preview, it's all encouraging. As you know, last week we announced pricing. Then we'll continue to work through the paid preview process, get good feedback. Then we'll announce the general availability date. Then we'll get to the GA date. Then we'll, of course, be able to sell it and then recognize revenue. And that is why I continue to say that I am just as excited as everyone else about this and it should be more h2 weighted and we've i think given you some sizing opportunities and and i think i would use all that but i do think this is really um about pacing and of course we've still got to get our security co-pilot and some of the dynamics workloads uh priced and released and we'll continue to work toward that um and of course i think One of the things that people often, I think, overlook is, and Safiya mentioned it briefly when you go back, does it pull along Azure? I think in many ways, lots of these AI products pull along Azure because it's not just the AI solution services that you need to build an app. And so it's less about Microsoft 365 pulling it along or any one copilot. It's that when you're building these, it requires data. and it requires the AI services. So you'll see them pull both core Azure and AI Azure along with them, and I think that's an important nuance as well. spk06: Yeah, and if I could just add to what Amy said, the platform effect here is really all about the extensibility of the co-pilots. You see that today when People build applications in teams that are built on PowerApps, and those PowerApps happen to use something like SQL DB on Azure. That's like a classic line of business extension. So you'll see the same thing. When I have a co-pilot plug-in, that plug-in uses Azure AI, Azure meters, Azure data sources, Azure semantic search. So you'll see, obviously, a pull through not only on the identity or security layer, but in the core PaaS services of Azure plus the co-pilot extensibility in M365. spk10: Terrific. Thank you. Thanks, Carl. Operator, next question, please. spk07: The next question comes from the line of Mark Murphy with JP Morgan. Please proceed. spk02: Yes, thank you very much. Sanche, there's so much evidence now that a GitHub copilot is boosting developer productivity by 40 to 50% or more, and it's resulting in higher quality code. Do you envision a similar level of productivity boost for the Microsoft 365 copilots or the security copilot or sales copilot? In other words, can every room in the house be remodeled to a similar extent such that that value proposition is pretty elevated across the entire stack. spk06: Yeah, you know, Judson Althoff would love you for having used his metaphor of remodeling every room of the house with AI because you're absolutely right. I mean, that's the opportunity we see. I think what you're also referencing is now there is good empirical evidence and data around the GitHub co-pilot and the productivity stats around it. And we're actively working on that for M365 co-pilot. Also for things like the role-based ones like sales co-pilot or service co-pilot. we see these business processes having very high productivity gains. And so, yes, over the course of the year, we will have all of that evidence. And I think at the end of the day, as Amy referenced, every CFO and CIO is also going to take a look at this. I do think for the first time, or rather, I do think people are going to look at how can they complement their OPEX spend with, essentially, these co-pilots in order to drive more efficiency and, quite frankly, even reduce the burden and drudgery of work on their OPEX and their people and so on. So, therefore, I think you're going to see all of that translated into product 2D stats, and we're looking forward to getting that data out. spk02: Thank you very much. spk10: Thanks, Mark. Operator, next question, please. spk07: The next question comes from the line of Alex Zukin with Wolf Research. Please proceed. spk09: Hey guys, thanks for taking the question. I guess maybe just a multi part. You mentioned a couple of times that with the AI workload adoption that you're seeing on Azure, it's starting to look maybe a little bit different from an incremental share gain perspective versus previous generations. Can you maybe expand upon that? How should that drive for Azure consumption, particularly as we get through the year? And do you see a scenario where either The combination of lapping the optimization headwind plus the AI contribution plus this incremental tailwind that you're seeing around the workloads actually does drive a reacceleration in Azure, particularly in the second half when you're going to start to see some of those things kick in. spk06: The thing that we are both seeing and excited about is I mean, if you think about Azure, we have grown Azure over the years, you know, coming from, you know, from behind. And here we are as a strong number two. in the lead when it comes to these new workloads. So, for example, we are seeing new logos. Customers who may have used another cloud for most of what they do are for the first time sort of starting to use Azure for some of their new AI workloads. We also have even customers who've used multiple clouds, who used us for a class of workloads, also start new projects when it's data and AI, which they were using other clouds for. What I think you will see us is more share gains, more logo gains, reducing our CAC even. And so those are the things, the points of leverage. But at the same time, we are not a small business anymore in any of these things. These are, you know, we're significantly, we're at a significant scale. And so, yes, we celebrate. That's why we're even giving you the visibility of one point of it showing up this quarter, a couple of points showing up next quarter. Those are material numbers. And so that's kind of what I think we'll track. And I think Amy mentioned it because we want, you know, there are two parts to even the AI, right? There's the models themselves with our partnership with OpenAI. That's sort of one type of spend on compute. And the other is much more revenue-driven, right, which is we will track the inference cost to the revenue and demand. And you're already seeing both of those play out. spk10: Thanks, Al. Operator, we have time for one last question. spk07: Our last question will come from the line of Kirk Materne with Evercore ISI. Please proceed. spk12: Yeah, thanks for squeezing me in. Satya, I was wondering if you could expand a little bit on your comments on data platforms. I think we've heard a lot over the last quarter or so about if you don't have a data strategy, it's tough to have an AI strategy. Can you just talk about where customers are right now in that journey to have a more I guess, thoughtful data strategy? And what does that mean in terms of their ability to adopt AI services? Meaning, do they have to sort of tackle the data issue first before they can really take advantage of all the AI services? Or how should we think about that sort of juxtaposition? Thanks. Yeah, sure. spk06: Thank you for the question. Yes, absolutely. I think having your data in particular in the cloud is sort of key to how you can take advantage of essentially these new AI reasoning engines to complement, I'll call it, your databases. Because these AI engines are not databases, but they can reason over your data and to help you then get more insights, more completions, more predictions. more summaries and what have you. So those are the things when we say co-pilot design pattern, that's sort of what that design pattern is all about. The thing that perhaps even in the last quarter, and I had that in my remarks, it's most exciting is how with Microsoft Fabric, especially for the analytics workloads, We brought together compute, storage, governance with a very disruptive business model. I mean, to give you a flavor for it, right, so you have your data in an Azure data lake. You can bring SQL compute to it. You can bring Spark to it. You can bring Azure AI or Azure Open AI to it, right? So the fact is you have storage. separated from all these compute meters, and they're all interchangeable, right? So you don't have to buy each of these separately. That's the disruptive business model. So I feel that we are, you know, Microsoft is very well positioned with the way our data architecture lays out our business model around data and how people will plan to use data with AI services. So that's kind of what I mean by getting your data estate in order. And it's just not getting data estate in order, but you have to have it structured such that you can have the flexibility that allows you to exercise the data and compute in combinations that make sense for this new age. spk10: Thanks, Kurt. That wraps up the Q&A portion of today's earnings call. Thank you for joining us today, and we look forward to speaking with all of you soon. Thank you all. spk07: Thank you, everyone. This concludes today's conference. You may disconnect your lines at this time. Thank you for your participation. </TRANSCRIPT> Please generate a JSON mapping from speaker label to speaker name. For example: { "spk01": {"name": "John Smith", "title": "CEO"}, "spk02": {"name": "Jane Doe", "title": "Director of Investor Relations"} } Please output just the JSON, nothing else. </INSTRUCTIONS> Response JSON:
Chat GPT's Response
And here is the model’s response:
Plain text{ "spk07": {"name": "Operator", "title": "Operator"}, "spk10": {"name": "Brett Iverson", "title": "Vice President of Investor Relations"}, "spk06": {"name": "Satya Nadella", "title": "Chairman and Chief Executive Officer"}, "spk04": {"name": "Amy Hood", "title": "Chief Financial Officer"}, "spk01": {"name": "Keith Weiss", "title": "Analyst at Morgan Stanley"}, "spk11": {"name": "Brent Thill", "title": "Analyst at Jefferies"}, "spk08": {"name": "Mark Moerdler", "title": "Analyst at Bernstein Research"}, "spk05": {"name": "Kash Rangan", "title": "Analyst at Goldman Sachs"}, "spk03": {"name": "Karl Keirstead", "title": "Analyst at UBS"}, "spk02": {"name": "Mark Murphy", "title": "Analyst at JP Morgan"}, "spk09": {"name": "Alex Zukin", "title": "Analyst at Wolfe Research"}, "spk12": {"name": "Kirk Materne", "title": "Analyst at Evercore ISI"} }
Note: The names and titles are accurately extracted from the transcript.
The Outcome
Employing an advanced language model proved to be a game-changer. The model effectively interpreted the nuances in the transcript, correctly identifying and mapping speaker names regardless of how they were introduced. This approach was significantly more flexible and reliable than our previous method.
Ensuring Good Output
If you play around with calling the GPT model enough, you may find non-JSON output contained in the response. To ensure you only get JSON, use the response_format
flag. NOTE: This only works for certain models, such as gpt-4o
.
Pythonfrom openai import OpenAI
client = OpenAI(api_key="SECRET API KEY HERE")
response = client.chat.completions.create(
model="gpt-4o",
messages=[
{
"role": "user",
"content": prompt,
}
],
response_format={
"type": "json_object"
}
)
For models such as o1-preview
, it does not support JSON as the response_format flag. Sometimes the o1-preview
will return markdown such as this:
Python```json
{
"spk01": "Amy Hood",
"spk02": "Kash Rangan",
"spk03": "Mark Murphy",
"spk04": "Karl Keirstead",
"spk05": "Satya Nadella",
"spk06": "Raimo Lenschow",
"spk07": "Brent Thill",
"spk08": "Brett Iverson",
"spk09": "Mark Moerdler",
"spk10": "Keith Weiss",
"spk11": "Rishi Jaluria",
"spk12": "Operator"
}
```
In that case, you need to sanitize and extract the JSON data from within the response. If you try to parse the string as-is, it will fail. We can use a helper-function called extract_json
to find and extract valid JSON from within the response:
Pythondef extract_json(text: str) -> Optional[Tuple[Any, int, int]]:
"""
Extract the first valid JSON object found in the text.
Similar to this: https://stackoverflow.com/a/10574546
Args:
text (str): Input string containing potential JSON
Returns:
Optional[Tuple[Any, int, int]]: Tuple containing:
- Parsed JSON object
- Start index of JSON in string
- End index of JSON in string
Returns None if no valid JSON is found
"""
first_open = -1
while True:
# Find next opening brace
first_open = text.find('{', first_open + 1)
if first_open == -1:
return None
# Start with last closing brace
first_close = text.rindex('}')
while first_close > first_open:
# Extract candidate JSON string
candidate = text[first_open:first_close + 1]
try:
# Attempt to parse the JSON
result = json.loads(candidate)
return result, first_open, first_close + 1
except json.JSONDecodeError:
# Find previous closing brace
first_close = text.rfind('}', 0, first_close)
if first_close <= first_open:
break
return None
Conclusion
The shift from a deterministic code-based approach to leveraging an advanced language model allowed us to overcome the challenges of accurately mapping speaker names in earnings call transcripts. This experience underscores the potential of artificial intelligence in tackling complex language tasks that are difficult to address with traditional programming methods.
Employing an advanced language model proved to be a game-changer. The model effectively interpreted the nuances in the transcript, correctly identifying and mapping speaker names and titles regardless of how they were introduced. This approach was significantly more flexible and reliable than our previous method.
By integrating advanced language models into our workflow, we’ve enhanced the quality of our transcripts, providing more value to users who rely on precise and informative documentation of earnings calls. This experience underscores the potential of artificial intelligence in tackling complex language tasks that are difficult to address with traditional programming methods.
About Us
At EarningsCall, we are dedicated to providing comprehensive earnings call transcripts and analysis, empowering investors and analysts to make faster, data-driven decisions that drive smarter investments.