diff --git a/data-computer/v1/lda.py b/data-computer/v1/lda.py index 9e467ab..53d1fb7 100755 --- a/data-computer/v1/lda.py +++ b/data-computer/v1/lda.py @@ -77,14 +77,15 @@ topics = lda_model[doc_bow] topic_info = {} for topic_id, topic_weight in topics: + topic_info[f"topic_{topic_id + 1}"] = {} topic_words = [word for word, _ in lda_model.show_topic(topic_id)] - topic_info[f"topic {topic_id + 1}"] = topic_words - topic_info[f"weight {topic_id + 1}"] = str(topic_weight) + topic_info[f"topic_{topic_id + 1}"]["words"] = topic_words + topic_info[f"topic_{topic_id + 1}"]["weight"] = str(topic_weight) line["lda"]= topic_info # Write all corpus in once for line in all_data: - sys.stdout.write(json.dumps(all_data)) + sys.stdout.write(json.dumps(line)) sys.stdout.write("\n")