% Conference paper, SYSTOR 2012 (ACM ICPS). The DOI is stored bare (no resolver
% prefix) and the language is given in English; the citation key is unchanged.
@inproceedings{43f2e6ffb28447cebfbdb7387689eaed,
  author    = {Mehrzadi, David and Feitelson, Dror G.},
  title     = {On extracting session data from activity logs},
  booktitle = {Proceedings of the 5th Annual International Systems and Storage Conference, {SYSTOR}'12},
  series    = {{ACM} International Conference Proceeding Series},
  year      = {2012},
  isbn      = {9781450314480},
  doi       = {10.1145/2367589.2367592},
  language  = {English},
  keywords  = {activity log, session, user behavior},
  abstract  = {Activity logs from large-scale systems facilitate the study of user behavior, which can be used to improve and tune the user experience. However, the available data often lacks important elements such as the identification of user sessions. Previous work typically compensated for this by setting a threshold of around 30 minutes, and assuming that breaks in activity longer than the threshold reflect breaks between sessions. We show that using such a global threshold introduces artifacts that may affect the analysis, because there is a high probability that long sessions are not identified correctly. As an alternative, we suggest that a suitable individual threshold be found for each user, based on that user's activity pattern. Applying this approach to a large dataset from the AOL search engine leads to a distribution of session durations that is free of artifacts like those that appear when using a global threshold.},
  note      = {5th Annual International Systems and Storage Conference, SYSTOR 2012 ; Conference date: 04-06-2012 Through 06-06-2012},
}