from mixpeek import Mixpeek
mix = Mixpeek(mixpeek_key="API_KEY")
# index our PPT file
mix.extract("file.ppt")
# now we have clean PPT data
[
{
"filename": "file.ppt",
"content": "This is the content of the ppt file",
"embedding": [0.1, 0.2, 0.3, ...],
"metadata": {
"author": "John Doe",
"date": "2022-01-01"
}
}
]
Read the Docs