Unsupervised Machine Learning and Data Mining DS 5230 / DS 4420 - Fall 2018 Lecture 16 Jan-Willem van de Meent
TOPIC MODELS (part 3) Borrowing from : David Blei (Columbia)
<latexit sha1_base64="z341rKqmpSRsPhmRMI2yHmkQTe8=">AGcXicfZTrTtswFIBTLh3LbrD9mvangIRAq1ACPgzCbGh7SdD3CRcVU5y2lpNnMx2oGD5UfYme5E9x15gdhpGE0dzperI5zs3n5MTZDHhwvN+t+bmFxbz5aeuy9evnr9Znl7SVPcxbCRZjGKbsOMIeYULgQRMRwnTHASRDVTD+bPRXt8A4Sem5uM+gl+AhJQMSYqGv+s/0a1EYRDLB6X6MupS1XE3ECdJx0UCJkJ+ITxkIEBtFpjBxQgELnC15SLkFi6GTE7+uUAJiTqP/JNntPoJrXbG7oZrIjQEYFERIJj6H2/1l9e9ba84HVvwS2H9yJme0/7Kwi8UpWGeABVhjDm/8b1M9CRmgoQxKBflHDIcjvEQbrRIcQK8J4t31JXPas/9nhykVANK2YSJzBYmRdGphXb8ORDgysGra87EnjJQJOhrRqFSTKdVEA93TIjMZBXEOSp59PVbS6+7vdv2dA1VDGEQl4R96Xf2rA0MGQEvkcK/r7x/aTJazLIYnyDOYyYBhbswTRJMTY8gVDf6fRBQnjMwheiuJXLdV0pZ8BTVNoXeRbPKiZJ6eGYT1AMwUXsfgYzhWro3oIemnw9WNiPJuxqK3sRTON8wY2t9jchpgFsXqG0BgTMk7ilFr1DGboYk4GdtB4hil7bFzGelFE2PKYjZrxbEQs9qzWmTNlxmWwGyYN1nlGbAsEiZ+ejuiBjFJCGCy1KvbCtC/2+l9fVgJ6o6lOY/COSJski9nYrBrL6dPaF6KVU5U2UDNmRVbNq4BjCrgeUDG1LvO7+3Wzhcmfb1/L3vfWj43LzLTkfnDVn0/GdA+fI+eacOhdO2JpvbV2WruLf9rv2532hSda5U275zKaX/8C/vUWpY=</latexit> <latexit sha1_base64="z341rKqmpSRsPhmRMI2yHmkQTe8=">AGcXicfZTrTtswFIBTLh3LbrD9mvangIRAq1ACPgzCbGh7SdD3CRcVU5y2lpNnMx2oGD5UfYme5E9x15gdhpGE0dzperI5zs3n5MTZDHhwvN+t+bmFxbz5aeuy9evnr9Znl7SVPcxbCRZjGKbsOMIeYULgQRMRwnTHASRDVTD+bPRXt8A4Sem5uM+gl+AhJQMSYqGv+s/0a1EYRDLB6X6MupS1XE3ECdJx0UCJkJ+ITxkIEBtFpjBxQgELnC15SLkFi6GTE7+uUAJiTqP/JNntPoJrXbG7oZrIjQEYFERIJj6H2/1l9e9ba84HVvwS2H9yJme0/7Kwi8UpWGeABVhjDm/8b1M9CRmgoQxKBflHDIcjvEQbrRIcQK8J4t31JXPas/9nhykVANK2YSJzBYmRdGphXb8ORDgysGra87EnjJQJOhrRqFSTKdVEA93TIjMZBXEOSp59PVbS6+7vdv2dA1VDGEQl4R96Xf2rA0MGQEvkcK/r7x/aTJazLIYnyDOYyYBhbswTRJMTY8gVDf6fRBQnjMwheiuJXLdV0pZ8BTVNoXeRbPKiZJ6eGYT1AMwUXsfgYzhWro3oIemnw9WNiPJuxqK3sRTON8wY2t9jchpgFsXqG0BgTMk7ilFr1DGboYk4GdtB4hil7bFzGelFE2PKYjZrxbEQs9qzWmTNlxmWwGyYN1nlGbAsEiZ+ejuiBjFJCGCy1KvbCtC/2+l9fVgJ6o6lOY/COSJski9nYrBrL6dPaF6KVU5U2UDNmRVbNq4BjCrgeUDG1LvO7+3Wzhcmfb1/L3vfWj43LzLTkfnDVn0/GdA+fI+eacOhdO2JpvbV2WruLf9rv2532hSda5U275zKaX/8C/vUWpY=</latexit> <latexit sha1_base64="z341rKqmpSRsPhmRMI2yHmkQTe8=">AGcXicfZTrTtswFIBTLh3LbrD9mvangIRAq1ACPgzCbGh7SdD3CRcVU5y2lpNnMx2oGD5UfYme5E9x15gdhpGE0dzperI5zs3n5MTZDHhwvN+t+bmFxbz5aeuy9evnr9Znl7SVPcxbCRZjGKbsOMIeYULgQRMRwnTHASRDVTD+bPRXt8A4Sem5uM+gl+AhJQMSYqGv+s/0a1EYRDLB6X6MupS1XE3ECdJx0UCJkJ+ITxkIEBtFpjBxQgELnC15SLkFi6GTE7+uUAJiTqP/JNntPoJrXbG7oZrIjQEYFERIJj6H2/1l9e9ba84HVvwS2H9yJme0/7Kwi8UpWGeABVhjDm/8b1M9CRmgoQxKBflHDIcjvEQbrRIcQK8J4t31JXPas/9nhykVANK2YSJzBYmRdGphXb8ORDgysGra87EnjJQJOhrRqFSTKdVEA93TIjMZBXEOSp59PVbS6+7vdv2dA1VDGEQl4R96Xf2rA0MGQEvkcK/r7x/aTJazLIYnyDOYyYBhbswTRJMTY8gVDf6fRBQnjMwheiuJXLdV0pZ8BTVNoXeRbPKiZJ6eGYT1AMwUXsfgYzhWro3oIemnw9WNiPJuxqK3sRTON8wY2t9jchpgFsXqG0BgTMk7ilFr1DGboYk4GdtB4hil7bFzGelFE2PKYjZrxbEQs9qzWmTNlxmWwGyYN1nlGbAsEiZ+ejuiBjFJCGCy1KvbCtC/2+l9fVgJ6o6lOY/COSJski9nYrBrL6dPaF6KVU5U2UDNmRVbNq4BjCrgeUDG1LvO7+3Wzhcmfb1/L3vfWj43LzLTkfnDVn0/GdA+fI+eacOhdO2JpvbV2WruLf9rv2532hSda5U275zKaX/8C/vUWpY=</latexit> <latexit sha1_base64="XFcmVykVZPeM9+UfOx4QUqSbsI=">AGcXicfZTrTtswFIBTLh3LbrD9mvangIRAq1ACPgzCbGh7SdD3CRcVU5y2lpNnMx2oGD5UfYme5E9x15gdhpGE0dzperI5zs3n5MTZDHhwvN+t+bmFxbz5aeuy9evnr9Znl7SVPcxbCRZjGKbsOMIeYULgQRMRwnTHASRDVTD+bPRXt8A4Sem5uM+gl+AhJQMSYqGv+s/0a1EYRDLB6X6MupS1XE3ECdJx0UCJkJ+ITxkIEBtFpjBxQgELnC15SLkFi6GTE7+uUAJiTqP/JNntPoJrXbG7oZrIjQEYFERIJj6H2/1l9e9ba84HVvwS2HdKc9pf2XhF4rSME+AijDGnN/4XiZ6EjNBwhiUi3IOGQ7HeAg3WqQ4Ad6TxTvqyme1535PDlIqgIYVM4kTnmAxsi4NzKu34UgHBlYNW172pPESASdDWrUKEuW6KIKB7mRmYyCOAclz74eK+l193e7/s6BqiEMopLwD72u/tWBIQOgJXK41/X3D20my1kWwxPkGcxkw4DCXZgmCamRxCqG/0+CjPGZhCdNcSue4rpSx4imqbQu+iWeVEST08swnqAZioOnY/g5lCNXRvQ9Nvh4s7EcT9jUVvaimcZ5A5tbG5DzIJYPUNojAkZJ3FKrXoGM3QxJwM7aDzDlD02LmO9KCJsecxGzXg2IhZ7VuvMmTLjMktgNkyw7jNKM2BYpMx8dHdEjGKSEMFlqVe2FaH/t9L6erATVR1K8x8E8kRZpN5OxWBW386eUL2UqpypsgEbsio2bVwDmNXA8oENqfedX9utnC5s+1r+fve+tFxufmWnA/OmrPp+M6Bc+R8c06dCydszbe2Wjut3cU/7ftTntis61Spt3TuW0P/4FqgVaVg=</latexit> Review: Topic Modeling β k : Topics x d: Words z d : Assignments θ d : Topic Proportions (document-specific) (shared) gene 0.04 dna 0.02 genetic 0.01 .,, life 0.02 evolve 0.01 organism 0.01 .,, brain 0.04 neuron 0.02 nerve 0.01 ... data 0.02 number 0.02 computer 0.01 .,, z d , n ∼ Discrete ( θ d ) x d , n | z d , n = k ∼ Discrete ( β k )
Recommend
More recommend