215 lines
5.2 KiB
Go
215 lines
5.2 KiB
Go
package statistics
|
|
|
|
import (
|
|
"context"
|
|
"database/sql"
|
|
"fmt"
|
|
"penahub.gitlab.yandexcloud.net/backend/quiz/common.git/utils"
|
|
"sort"
|
|
"strings"
|
|
)
|
|
|
|
type DepsClick struct {
|
|
Conn *sql.DB
|
|
}
|
|
|
|
type StatisticClick struct {
|
|
conn *sql.DB
|
|
}
|
|
|
|
func NewClickStatistic(ctx context.Context, deps DepsClick) (*StatisticClick, error) {
|
|
s := &StatisticClick{
|
|
conn: deps.Conn,
|
|
}
|
|
|
|
err := s.checkMW(ctx)
|
|
if err != nil {
|
|
fmt.Println("error check material view existing", err)
|
|
return nil, err
|
|
}
|
|
|
|
return s, nil
|
|
}
|
|
|
|
func (s *StatisticClick) checkMW(ctx context.Context) error {
|
|
query := `
|
|
CREATE MATERIALIZED VIEW IF NOT EXISTS mv_last_answers_events
|
|
ENGINE = MergeTree()
|
|
ORDER BY (ctxsession, event_time) POPULATE AS
|
|
SELECT
|
|
event_time, ctxsession, ctxquizid, ctxquestionid, ctxidint, message, keyos,
|
|
ctxuserip, ctxuserport, keydomain, keypath, ctxquiz, ctxreferrer
|
|
FROM (SELECT
|
|
event_time, ctxsession, ctxquizid, ctxquestionid, ctxidint, message, keyos,
|
|
ctxuserip, ctxuserport, keydomain, keypath, ctxquiz, ctxreferrer,
|
|
row_number() OVER (PARTITION BY ctxsession ORDER BY event_time DESC) as row_num
|
|
FROM statistics
|
|
WHERE message IN ('InfoQuizOpen', 'InfoAnswer', 'InfoResult') AND event_level = 'info') AS sorted
|
|
WHERE row_num = 1;
|
|
`
|
|
_, err := s.conn.ExecContext(ctx, query)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
}
|
|
|
|
type Statistic struct {
|
|
Count int64
|
|
QuestionID int64
|
|
}
|
|
|
|
type PipeLineStatsResp [][]Statistic
|
|
|
|
// пример:
|
|
//"[0, 116783, 116810]"
|
|
//"[0, 116783, 116798]"
|
|
//"[0, 116783, 116798, 116831]"
|
|
//"[0, 116783, 116810, 116849]"
|
|
//[0]
|
|
//"[0, 116783]"
|
|
//"[0, 116783, 116810, 116843]"
|
|
|
|
//SELECT DISTINCT last_que, reversed
|
|
//FROM ( SELECT groupArray(ctxquestionid) AS reversed, arraySlice(arrayReverse(groupArray(ctxquestionid)), 1, 1)[1] AS last_que
|
|
//FROM statistics WHERE ctxquizid = 26276 GROUP BY ctxsession ) AS sub;
|
|
|
|
func (s *StatisticClick) getFunnel(ctx context.Context, quizID int64, from uint64, to uint64) (map[int64][]int64, error) {
|
|
query := `
|
|
SELECT DISTINCT last_que, reversed
|
|
FROM ( SELECT groupArray(ctxquestionid) AS reversed, arraySlice(arrayReverse(groupArray(ctxquestionid)), 1, 1)[1] AS last_que
|
|
FROM statistics WHERE ctxquizid = ? AND event_time BETWEEN ? AND ? GROUP BY ctxsession ) AS sub;
|
|
`
|
|
|
|
rows, err := s.conn.QueryContext(ctx, query, quizID, from, to)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
defer rows.Close()
|
|
|
|
funnel := make(map[int64][]int64)
|
|
for rows.Next() {
|
|
var lastQue int64
|
|
var reversed []int64
|
|
if err := rows.Scan(&lastQue, &reversed); err != nil {
|
|
return nil, err
|
|
}
|
|
funnel[lastQue] = reversed
|
|
}
|
|
|
|
if err := rows.Err(); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
result := make(map[int64][]int64)
|
|
keys := make([]int64, 0, len(funnel))
|
|
for key := range funnel {
|
|
keys = append(keys, key)
|
|
}
|
|
sort.Slice(keys, func(i, j int) bool {
|
|
return keys[i] < keys[j]
|
|
})
|
|
|
|
for _, lastQue := range keys {
|
|
reversed := funnel[lastQue]
|
|
found := false
|
|
|
|
for _, otherLastQue := range keys {
|
|
if otherLastQue != lastQue {
|
|
otherReversed := funnel[otherLastQue]
|
|
index := utils.BinarySearch(lastQue, otherReversed)
|
|
if index {
|
|
found = true
|
|
break
|
|
}
|
|
}
|
|
}
|
|
|
|
if !found {
|
|
result[lastQue] = reversed
|
|
}
|
|
}
|
|
|
|
return result, nil
|
|
}
|
|
|
|
func (s *StatisticClick) GetPipelinesStatistics(ctx context.Context, quizID int64, from uint64, to uint64) (PipeLineStatsResp, error) {
|
|
var pipelines PipeLineStatsResp
|
|
|
|
// получили id вопросов воронок где массив состоит из 1 элемента
|
|
funnel, err := s.getFunnel(ctx, quizID, from, to)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
var idS []int64
|
|
for queID := range funnel {
|
|
idS = append(idS, queID)
|
|
}
|
|
|
|
if len(idS) == 0 {
|
|
return nil, nil
|
|
}
|
|
// тут считаем количество ответов на эти вопросы по уникальным сессиям
|
|
sesCount, err := s.countSession(ctx, quizID, from, to, idS)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
for questionID := range funnel {
|
|
if sessionCount, ok := sesCount[questionID]; ok {
|
|
pipeline := []Statistic{
|
|
{
|
|
QuestionID: questionID,
|
|
Count: sessionCount,
|
|
},
|
|
}
|
|
pipelines = append(pipelines, pipeline)
|
|
}
|
|
}
|
|
|
|
return pipelines, nil
|
|
}
|
|
|
|
func (s *StatisticClick) countSession(ctx context.Context, quizID int64, from uint64, to uint64, questionIDs []int64) (map[int64]int64, error) {
|
|
placeholders := make([]string, len(questionIDs))
|
|
args := make([]interface{}, len(questionIDs)+3)
|
|
args[0] = quizID
|
|
for i, id := range questionIDs {
|
|
placeholders[i] = "?"
|
|
args[i+1] = id
|
|
}
|
|
args[len(args)-2] = from
|
|
args[len(args)-1] = to
|
|
|
|
query := fmt.Sprintf(`
|
|
SELECT ctxquestionid, COUNT(DISTINCT ctxsession) AS session_count
|
|
FROM statistics
|
|
WHERE ctxquizid = ? AND ctxquestionid IN (%s) AND event_time BETWEEN ? AND ?
|
|
GROUP BY ctxquestionid;
|
|
`, strings.Join(placeholders, ","))
|
|
|
|
rows, err := s.conn.QueryContext(ctx, query, args...)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
defer rows.Close()
|
|
|
|
counts := make(map[int64]int64)
|
|
|
|
for rows.Next() {
|
|
var questionID int64
|
|
var count int64
|
|
err := rows.Scan(&questionID, &count)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
counts[questionID] = count
|
|
}
|
|
|
|
if err := rows.Err(); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return counts, nil
|
|
}
|