databaseRead.go 8.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310
  1. package lib
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "sort"
  6. )
  7. //topicPointer and textPointer should not be exported
  8. //mb move tweet reconstruction to dbRead from servers
  9. type Tweet struct {
  10. TopicPointer string
  11. TextPointer int
  12. Topics []string
  13. Text string
  14. RoundPosted int
  15. }
  16. var dbR = make(map[string][]Tweet)
  17. var archive = make(map[string][]Tweet)
  18. //needs to be dividable by roundsBeforUpdate
  19. var roundsBeforeArchiving = 12
  20. var roundsBeforeArchivingInc = roundsBeforeArchiving
  21. var bytesSaved float64
  22. var topicList []string
  23. var archiveTopicList []string
  24. func NewEntries(inputTweets []Tweet, whereTo int) {
  25. tmpdb := dbR
  26. if whereTo == 1 {
  27. tmpdb = archive
  28. }
  29. var position int = 0
  30. for _, tweet := range inputTweets {
  31. for index := range tweet.Topics {
  32. //new topic
  33. if _, ok := tmpdb[tweet.Topics[index]]; !ok {
  34. if whereTo == 0 {
  35. topicList = append(topicList, tweet.Topics[index])
  36. } else {
  37. archiveTopicList = append(archiveTopicList, tweet.Topics[index])
  38. }
  39. }
  40. //new tweet
  41. if index == 0 {
  42. position = len(tmpdb[tweet.Topics[0]])
  43. tmpdb[tweet.Topics[index]] = append(tmpdb[tweet.Topics[0]], tweet)
  44. } else {
  45. //known tweet
  46. //setting pointer for all other Topics
  47. if whereTo == 1 {
  48. bytesSaved += float64(len(tweet.Topics)) + float64(len(tweet.Text))
  49. }
  50. topic := tweet.Topics[index]
  51. var pointerTweet Tweet
  52. pointerTweet.TopicPointer = tweet.Topics[0]
  53. pointerTweet.TextPointer = position
  54. pointerTweet.Topics = nil
  55. pointerTweet.Text = ""
  56. tmpdb[topic] = append(tmpdb[topic], pointerTweet)
  57. }
  58. }
  59. }
  60. if whereTo == 0 {
  61. dbR = tmpdb
  62. } else {
  63. archive = tmpdb
  64. }
  65. }
  66. //todo! add round to pirquery only get tweets that have been posted from that round onward
  67. func GetTweets(pirQuery []byte, dataLength int, whereFrom int, pubKey [32]byte) []byte {
  68. tmpdb := dbR
  69. if whereFrom == 1 {
  70. tmpdb = archive
  71. }
  72. var wantedTopics = getNamesForTopics(pirQuery, whereFrom)
  73. tweetsToReturn := make([][]Tweet, len(wantedTopics))
  74. for index, wantedTopic := range wantedTopics {
  75. for _, tweet := range tmpdb[wantedTopic] {
  76. //new Tweet
  77. if tweet.Text != "" {
  78. tweet.RoundPosted = 0
  79. tweetsToReturn[index] = append(tweetsToReturn[index], tweet)
  80. } else {
  81. //"copied" tweet
  82. //find tweet with pointers
  83. tweet = tmpdb[tweet.TopicPointer][tweet.TextPointer]
  84. tweet.RoundPosted = 0
  85. tweetsToReturn[index] = append(tweetsToReturn[index], tweet)
  86. }
  87. }
  88. }
  89. return tweetsToByteArray(tweetsToReturn, whereFrom, wantedTopics, dataLength)
  90. }
  91. func getNamesForTopics(wantedIndices []byte, whereFrom int) []string {
  92. var topicNames []string
  93. tmpTopicList := topicList
  94. if whereFrom == 1 {
  95. tmpTopicList = archiveTopicList
  96. }
  97. for index, element := range wantedIndices {
  98. if index == len(tmpTopicList) {
  99. break
  100. }
  101. if element == 1 {
  102. topicNames = append(topicNames, tmpTopicList[index])
  103. }
  104. }
  105. return topicNames
  106. }
  107. //transform struct to byte array for sending
  108. func tweetsToByteArray(tweetsToReturn [][]Tweet, whereFrom int, wantedTopics []string, dataLength int) []byte {
  109. //factor is an estimated nr that works, there probably is a smarter way to do this
  110. factor := 0.4
  111. minimumBlockSize := int(factor * float64(dataLength*maxLength(whereFrom)))
  112. tweetsAsBytes := make([]byte, minimumBlockSize)
  113. for _, block := range tweetsToReturn {
  114. var topicPadding []string
  115. var blockToAppend []byte
  116. for index, tweet := range block {
  117. for topicIndex, topic := range tweet.Topics {
  118. blockToAppend = append(blockToAppend, []byte(topic)...)
  119. blockToAppend = append(blockToAppend, ","...)
  120. //gets the topic used for padding
  121. if topicIndex > 0 && index < len(wantedTopics) && topic != wantedTopics[index] {
  122. topicPadding = append(topicPadding, topic)
  123. }
  124. }
  125. //replaces last "," with ";;" bc there is text following and not another topic
  126. blockToAppend = blockToAppend[:len(blockToAppend)-1]
  127. blockToAppend = append(blockToAppend, []byte(";;")[:]...)
  128. blockToAppend = append(blockToAppend, []byte(tweet.Text)...)
  129. blockToAppend = append(blockToAppend, []byte(";")[0])
  130. }
  131. //adds padding
  132. blockToAppend = append(blockToAppend, []byte(";;;")[:]...)
  133. remainingLength := minimumBlockSize - len(blockToAppend)
  134. //grouping using topic from recovered tweets
  135. index := len(topicPadding) - 1
  136. for index >= 0 && remainingLength > 0 && topicPadding[index] != "" {
  137. paddingTweet, err := getNextTweet(topicPadding[index], index, whereFrom)
  138. if err {
  139. break
  140. }
  141. if remainingLength < len(paddingTweet) {
  142. break
  143. }
  144. blockToAppend = append(blockToAppend, paddingTweet...)
  145. remainingLength -= len(paddingTweet)
  146. index--
  147. }
  148. padding := bytes.Repeat([]byte(";"), remainingLength)
  149. blockToAppend = append(blockToAppend, padding...)
  150. Xor(blockToAppend, tweetsAsBytes)
  151. }
  152. return tweetsAsBytes
  153. }
  154. func maxLength(whereFrom int) int {
  155. tmpdb := dbR
  156. if whereFrom == 1 {
  157. tmpdb = archive
  158. }
  159. var max int = 0
  160. for i := range tmpdb {
  161. nrOfTweets := len(tmpdb[i])
  162. if nrOfTweets > max {
  163. max = nrOfTweets
  164. }
  165. }
  166. return max
  167. }
  168. //gets the Tweet at index from wantedTopic for padding
  169. func getNextTweet(wantedTopic string, index, whereFrom int) ([]byte, bool) {
  170. tmpdb := dbR
  171. if whereFrom == 1 {
  172. tmpdb = archive
  173. }
  174. var tweetToReturn Tweet
  175. for tweetIndex, tweet := range tmpdb[wantedTopic] {
  176. if len(tmpdb[wantedTopic]) <= index {
  177. return nil, true
  178. } else if tweetIndex < index {
  179. continue
  180. } else if tweetIndex > index {
  181. break
  182. }
  183. //new Tweet
  184. if tweet.Text != "" {
  185. tweet.RoundPosted = 0
  186. tweetToReturn = tweet
  187. } else {
  188. //"copied" tweet
  189. //find tweet with pointers
  190. tweet = tmpdb[tweet.TopicPointer][tweet.TextPointer]
  191. tweet.RoundPosted = 0
  192. tweetToReturn = tweet
  193. }
  194. }
  195. var tweetToReturnBytes []byte
  196. for _, topic := range tweetToReturn.Topics {
  197. tweetToReturnBytes = append(tweetToReturnBytes, []byte(topic)...)
  198. tweetToReturnBytes = append(tweetToReturnBytes, ","...)
  199. }
  200. //replaces last "," with ";;" bc there is text following and not another topic
  201. tweetToReturnBytes = tweetToReturnBytes[:len(tweetToReturnBytes)-1]
  202. tweetToReturnBytes = append(tweetToReturnBytes, []byte(";;")[:]...)
  203. tweetToReturnBytes = append(tweetToReturnBytes, []byte(tweetToReturn.Text)...)
  204. tweetToReturnBytes = append(tweetToReturnBytes, []byte(";")[0])
  205. return tweetToReturnBytes, false
  206. }
  207. //see func name
  208. func GetTopicList(whereFrom int) ([]byte, int) {
  209. tmpTopicList := topicList
  210. if whereFrom == 1 {
  211. tmpTopicList = archiveTopicList
  212. }
  213. if (len(tmpTopicList)) == 0 {
  214. return nil, 0
  215. }
  216. topicByteArray := new(bytes.Buffer)
  217. json.NewEncoder(topicByteArray).Encode(tmpTopicList)
  218. return topicByteArray.Bytes(), len(tmpTopicList)
  219. }
  220. //iterates through full dbR and moves old tweets to archive
  221. func CleanUpdbR(round int) {
  222. if roundsBeforeArchiving == -1 {
  223. return
  224. }
  225. if roundsBeforeArchivingInc-round == 0 {
  226. keys := make([]string, len(dbR))
  227. i := 0
  228. for k := range dbR {
  229. keys[i] = k
  230. i++
  231. }
  232. sort.Strings(keys)
  233. var tweetsToArchive []Tweet
  234. for _, topic := range keys {
  235. tweets := dbR[topic]
  236. for i := len(tweets) - 1; i >= 0; i-- {
  237. if round-roundsBeforeArchiving >= tweets[i].RoundPosted {
  238. //only adds the tweet to the archive when there is text
  239. if tweets[i].Text != "" {
  240. tweetsToArchive = append(tweetsToArchive, tweets[i])
  241. }
  242. //delets the tweet from the array
  243. row := append(tweets[:i], tweets[i+1:]...)
  244. tweets = row
  245. }
  246. }
  247. dbR[topic] = tweets
  248. }
  249. NewEntries(tweetsToArchive, 1)
  250. roundsBeforeArchivingInc += roundsBeforeArchiving
  251. //redoes the whole dbR to correct pointers
  252. var tweetsToMain []Tweet
  253. for _, topic := range keys {
  254. tweets := dbR[topic]
  255. for _, tweet := range tweets {
  256. if tweet.Text != "" {
  257. tweetsToMain = append(tweetsToMain, tweet)
  258. }
  259. }
  260. }
  261. dbR = nil
  262. dbR = make(map[string][]Tweet)
  263. topicList = nil
  264. NewEntries(tweetsToMain, 0)
  265. }
  266. }
  267. func GetBytesSaved() float64 {
  268. return bytesSaved / float64(len(archive))
  269. }