diff options
author | "Vincent Ambo ext:(%22) <tazjin@me.com> | 2012-02-22T21·03+0100 |
---|---|---|
committer | "Vincent Ambo ext:(%22) <tazjin@me.com> | 2012-02-22T21·03+0100 |
commit | b951faa6b4771693f08b4002c771a508904d97a1 (patch) | |
tree | 93177791ac00c21ea864920db9ed6faefee4bea3 /tools/convertdb |
* initial checkin
Diffstat (limited to 'tools/convertdb')
-rw-r--r-- | tools/convertdb/.DS_Store | bin | 0 -> 6148 bytes | |||
-rw-r--r-- | tools/convertdb/Makefile | 13 | ||||
-rw-r--r-- | tools/convertdb/convertdb.go | 121 | ||||
-rw-r--r-- | tools/convertdb/couch.go | 403 |
4 files changed, 537 insertions, 0 deletions
diff --git a/tools/convertdb/.DS_Store b/tools/convertdb/.DS_Store new file mode 100644 index 000000000000..5de3023c9b98 --- /dev/null +++ b/tools/convertdb/.DS_Store Binary files differdiff --git a/tools/convertdb/Makefile b/tools/convertdb/Makefile new file mode 100644 index 000000000000..eba288ec1d5b --- /dev/null +++ b/tools/convertdb/Makefile @@ -0,0 +1,13 @@ +all: convertdb + +convertdb: couch.8 convertdb.8 + 8l -o convertdb convertdb.8 + +convertdb.8: convertdb.go + 8g convertdb.go + +couch.8: couch.go + 8g couch.go + +clean: + rm -rf *.8 convertdb diff --git a/tools/convertdb/convertdb.go b/tools/convertdb/convertdb.go new file mode 100644 index 000000000000..adef31910bf1 --- /dev/null +++ b/tools/convertdb/convertdb.go @@ -0,0 +1,121 @@ +package main + +import ( + "strconv" + "fmt" + "io/ioutil" + "json" + "./couch" + "os" + "time" +) + +//old +type OldComment struct { + Author string + Text string + Date string +} + +type OldEntry struct { + Id string + Title string + Author string + Text string + Mtext string + Comments []OldComment +} + +//new +type Comment struct { + Author string `json:"cauthor"` + Text string `json:"ctext"` + Date int64 `json:"cdate"` +} + +type Entry struct { + Id string `json:"_id"` + Year int `json:"year"` + Month int `json:"month"` + Day int + Lang string `json:"lang"` + Title string `json:"title"` + Author string `json:"author"` + Text string `json:"text"` + Mtext string `json:"mtext"` + Comments []Comment `json:"comments"` +} + +func main() { + getAllByYear("2011", 8, 12) + getAllByYear("2012", 1, 2) +} + +func getAllByYear(year string, minm, maxm int){ + db, _ := couch.NewDatabase("127.0.0.1", "5984", "tazblog") + for i:=minm;i<=maxm;i++{ + dirList, err := ioutil.ReadDir(fmt.Sprintf("data/%s/%02d/", year, i)) + if err != nil { + fmt.Println(err.String()) + os.Exit(1) + } + for d:=len(dirList)-1; d>-1; d--{ + content, cErr := ioutil.ReadFile(fmt.Sprintf("data/%s/%02d/%s", year, i, dirList[d].Name)) + if cErr != nil { + fmt.Println(cErr) + os.Exit(1) + } + var oEntry OldEntry + jErr := json.Unmarshal(content, &oEntry) + if jErr != nil { + fmt.Println(jErr.String()) + os.Exit(1) + } + nEntry := convertEntry(oEntry, fmt.Sprintf("data/%s/%02d/%s", year, i, dirList[d].Name)) + eId, _, err := db.Insert(nEntry) + if err != nil { + fmt.Println(err.String()) + os.Exit(1) + } + fmt.Println("Inserted " + eId) + } + } +} + +func convertEntry(oEntry OldEntry, p string) Entry{ + var nEntry Entry + nComments := make([]Comment, len(oEntry.Comments)) + for i:=0;i<len(oEntry.Comments);i++{ + nComments[i].Author = oEntry.Comments[i].Author + nComments[i].Text = oEntry.Comments[i].Text + nComments[i].Date = parseDumbTime(oEntry.Comments[i].Date) + } + + nEntry.Id = oEntry.Id[3:] + nEntry.Year, _ = strconv.Atoi(p[5:9]) + nEntry.Month, _ = strconv.Atoi(p[10:12]) + nEntry.Day, _ = strconv.Atoi(p[13:15]) + nEntry.Title = oEntry.Title + nEntry.Author = oEntry.Author + nEntry.Mtext = oEntry.Mtext + nEntry.Text = oEntry.Text + nEntry.Comments = nComments + nEntry.Lang = "de" + + return nEntry +} + +//http://tazj.in/2012/02/10.155234 +func parseEntryTime(year, month, day int, ids string) string { + x := fmt.Sprintf() +} + +func parseDumbTime(Year, Month, Day int, ) int64 { + x, err := time.Parse("[Am 02.01.2006 um 15:04 Uhr]", ct) + if err != nil { + fmt.Println(err.String()) + os.Exit(1) + } + + return x.Seconds() +} diff --git a/tools/convertdb/couch.go b/tools/convertdb/couch.go new file mode 100644 index 000000000000..764eb49a6099 --- /dev/null +++ b/tools/convertdb/couch.go @@ -0,0 +1,403 @@ +// -*- tab-width: 4 -*- +package couch + +import ( + "bytes" + "fmt" + "os" + "json" + "http" + "net" + "io/ioutil" + "url" +) + +var def_hdrs = map[string][]string{} + +type buffer struct { + b *bytes.Buffer +} + +func (b *buffer) Read(out []byte) (int, os.Error) { + return b.b.Read(out) +} + +func (b *buffer) Close() os.Error { return nil } + +// Converts given URL to string containing the body of the response. +func url_to_buf(u string) []byte { + if r, err := http.Get(u); err == nil { + b, err := ioutil.ReadAll(r.Body) + r.Body.Close() + if err == nil { + return b + } + } + return make([]byte, 0) +} + +type IdAndRev struct { + Id string `json:"_id"` + Rev string `json:"_rev"` +} + +// Sends a query to CouchDB and parses the response back. +// method: the name of the HTTP method (POST, PUT,...) +// url: the URL to interact with +// headers: additional headers to pass to the request +// in: body of the request +// out: a structure to fill in with the returned JSON document +func (p Database) interact(method, u string, headers map[string][]string, in []byte, out interface{}) (int, os.Error) { + fullHeaders := map[string][]string{} + for k, v := range headers { + fullHeaders[k] = v + } + bodyLength := 0 + if in != nil { + bodyLength = len(in) + fullHeaders["Content-Type"] = []string{"application/json"} + } + req := http.Request{ + Method: method, + ProtoMajor: 1, + ProtoMinor: 1, + Close: true, + ContentLength: int64(bodyLength), + Header: fullHeaders, + } + req.TransferEncoding = []string{"chunked"} + req.URL, _ = url.Parse(u) + if in != nil { + req.Body = &buffer{bytes.NewBuffer(in)} + } + conn, err := net.Dial("tcp", fmt.Sprintf("%s:%s", p.Host, p.Port)) + if err != nil { + return 0, err + } + http_conn := http.NewClientConn(conn, nil) + defer http_conn.Close() + if err := http_conn.Write(&req); err != nil { + return 0, err + } + r, err := http_conn.Read(&req) + if err != nil { + return 0, err + } + if r.StatusCode < 200 || r.StatusCode >= 300 { + b := []byte{} + r.Body.Read(b) + return r.StatusCode, os.NewError("server said: " + r.Status) + } + decoder := json.NewDecoder(r.Body) + if err = decoder.Decode(out); err != nil { + return 0, err + } + r.Body.Close() + return r.StatusCode, nil +} + +type Database struct { + Host string + Port string + Name string +} + +func (p Database) BaseURL() string { + return fmt.Sprintf("http://%s:%s", p.Host, p.Port) +} + +func (p Database) DBURL() string { + return fmt.Sprintf("%s/%s", p.BaseURL(), p.Name) +} + +// Test whether CouchDB is running (ignores Database.Name) +func (p Database) Running() bool { + u := fmt.Sprintf("%s/%s", p.BaseURL(), "_all_dbs") + s := url_to_buf(u) + if len(s) > 0 { + return true + } + return false +} + +type database_info struct { + Db_name string + // other stuff too, ignore for now +} + +// Test whether specified database exists in specified CouchDB instance +func (p Database) Exists() bool { + di := new(database_info) + if err := json.Unmarshal(url_to_buf(p.DBURL()), di); err != nil { + return false + } + if di.Db_name != p.Name { + return false + } + return true +} + +func (p Database) create_database() os.Error { + ir := response{} + if _, err := p.interact("PUT", p.DBURL(), def_hdrs, nil, &ir); err != nil { + return err + } + if !ir.Ok { + return os.NewError("Create database operation returned not-OK") + } + return nil +} + +// Deletes the given database and all documents +func (p Database) DeleteDatabase() os.Error { + ir := response{} + if _, err := p.interact("DELETE", p.DBURL(), def_hdrs, nil, &ir); err != nil { + return err + } + if !ir.Ok { + return os.NewError("Delete database operation returned not-OK") + } + return nil +} + +func NewDatabase(host, port, name string) (Database, os.Error) { + db := Database{host, port, name} + if !db.Running() { + return db, os.NewError("CouchDB not running") + } + if !db.Exists() { + if err := db.create_database(); err != nil { + return db, err + } + } + return db, nil +} + +// Strip _id and _rev from d, returning them separately if they exist +func clean_JSON(d interface{}) (json_buf []byte, id, rev string, err os.Error) { + json_buf, err = json.Marshal(d) + if err != nil { + return + } + m := map[string]interface{}{} + err = json.Unmarshal(json_buf, &m) + if err != nil { + return + } + id_rev := new(IdAndRev) + err = json.Unmarshal(json_buf, &id_rev) + if err != nil { + return + } + if _, ok := m["_id"]; ok { + id = id_rev.Id + m["_id"] = nil, false + } + if _, ok := m["_rev"]; ok { + rev = id_rev.Rev + m["_rev"] = nil, false + } + json_buf, err = json.Marshal(m) + return +} + +type response struct { + Ok bool + Id string + Rev string + Error string + Reason string +} + +// Inserts document to CouchDB, returning id and rev on success. +// Document may specify both "_id" and "_rev" fields (will overwrite existing) +// or just "_id" (will use that id, but not overwrite existing) +// or neither (will use autogenerated id) +func (p Database) Insert(d interface{}) (string, string, os.Error) { + json_buf, id, rev, err := clean_JSON(d) + if err != nil { + return "", "", err + } + if id != "" && rev != "" { + new_rev, err2 := p.Edit(d) + return id, new_rev, err2 + } else if id != "" { + return p.insert_with(json_buf, id) + } else if id == "" { + return p.insert(json_buf) + } + return "", "", os.NewError("invalid Document") +} + +// Private implementation of simple autogenerated-id insert +func (p Database) insert(json_buf []byte) (string, string, os.Error) { + ir := response{} + if _, err := p.interact("POST", p.DBURL(), def_hdrs, json_buf, &ir); err != nil { + return "", "", err + } + if !ir.Ok { + return "", "", os.NewError(fmt.Sprintf("%s: %s", ir.Error, ir.Reason)) + } + return ir.Id, ir.Rev, nil +} + +// Inserts the given document (shouldn't contain "_id" or "_rev" tagged fields) +// using the passed 'id' as the _id. Will fail if the id already exists. +func (p Database) InsertWith(d interface{}, id string) (string, string, os.Error) { + json_buf, err := json.Marshal(d) + if err != nil { + return "", "", err + } + return p.insert_with(json_buf, id) +} + +// Private implementation of insert with given id +func (p Database) insert_with(json_buf []byte, id string) (string, string, os.Error) { + u := fmt.Sprintf("%s/%s", p.DBURL(), url.QueryEscape(id)) + ir := response{} + if _, err := p.interact("PUT", u, def_hdrs, json_buf, &ir); err != nil { + return "", "", err + } + if !ir.Ok { + return "", "", os.NewError(fmt.Sprintf("%s: %s", ir.Error, ir.Reason)) + } + return ir.Id, ir.Rev, nil +} + +// Edits the given document, returning the new revision. +// d must contain "_id" and "_rev" tagged fields. +func (p Database) Edit(d interface{}) (string, os.Error) { + json_buf, err := json.Marshal(d) + if err != nil { + return "", err + } + id_rev := new(IdAndRev) + err = json.Unmarshal(json_buf, id_rev) + if err != nil { + return "", err + } + if id_rev.Id == "" { + return "", os.NewError("Id not specified in interface") + } + if id_rev.Rev == "" { + return "", os.NewError("Rev not specified in interface (try InsertWith)") + } + u := fmt.Sprintf("%s/%s", p.DBURL(), url.QueryEscape(id_rev.Id)) + ir := response{} + if _, err = p.interact("PUT", u, def_hdrs, json_buf, &ir); err != nil { + return "", err + } + return ir.Rev, nil +} + +// Edits the given document, returning the new revision. +// d should not contain "_id" or "_rev" tagged fields. If it does, they will +// be overwritten with the passed values. +func (p Database) EditWith(d interface{}, id, rev string) (string, os.Error) { + if id == "" || rev == "" { + return "", os.NewError("EditWith: must specify both id and rev") + } + json_buf, err := json.Marshal(d) + if err != nil { + return "", err + } + m := map[string]interface{}{} + err = json.Unmarshal(json_buf, &m) + if err != nil { + return "", err + } + m["_id"] = id + m["_rev"] = rev + return p.Edit(m) +} + +// Unmarshals the document matching id to the given interface, returning rev. +func (p Database) Retrieve(id string, d interface{}) (string, os.Error) { + if id == "" { + return "", os.NewError("no id specified") + } + json_buf := url_to_buf(fmt.Sprintf("%s/%s", p.DBURL(), id)) + id_rev := new(IdAndRev) + if err := json.Unmarshal(json_buf, &id_rev); err != nil { + return "", err + } + if id_rev.Id != id { + return "", os.NewError("invalid id specified") + } + return id_rev.Rev, json.Unmarshal(json_buf, d) +} + +// Deletes document given by id and rev. +func (p Database) Delete(id, rev string) os.Error { + headers := map[string][]string{ + "If-Match": []string{rev}, + } + u := fmt.Sprintf("%s/%s", p.DBURL(), id) + ir := response{} + if _, err := p.interact("DELETE", u, headers, nil, &ir); err != nil { + return err + } + if !ir.Ok { + return os.NewError(fmt.Sprintf("%s: %s", ir.Error, ir.Reason)) + } + return nil +} + +type Row struct { + Id *string +} + +type keyed_view_response struct { + Total_rows uint64 + Offset uint64 + Rows []Row +} + +// Return array of document ids as returned by the given view/options combo. +// view should be eg. "_design/my_foo/_view/my_bar" +// options should be eg. { "limit": 10, "key": "baz" } +func (p Database) QueryIds(view string, options map[string]interface{}) ([]string, os.Error) { + kvr := new(keyed_view_response) + + if err := p.Query(view, options, kvr); err != nil { + fmt.Println("Query error: " + err.String()) + return make([]string, 0), err + } + ids := make([]string, len(kvr.Rows)) + i := 0 + for _, row := range kvr.Rows { + if row.Id != nil { + ids[i] = *row.Id + i++ + } + } + return ids[:i], nil +} + +func (p Database) Query(view string, options map[string]interface{}, results interface{}) os.Error { + if view == "" { + return os.NewError("empty view") + } + + var parameters string + for k, v := range options { + switch t := v.(type) { + case string: + parameters += fmt.Sprintf(`%s=%s&`, k, url.QueryEscape(t)) + case int: + parameters += fmt.Sprintf(`%s=%d&`, k, t) + case bool: + parameters += fmt.Sprintf(`%s=%v&`, k, t) + default: + // TODO more types are supported + panic(fmt.Sprintf("unsupported value-type %T in Query", t)) + } + } + full_url := fmt.Sprintf("%s/%s?%s", p.DBURL(), view, parameters) + json_buf := url_to_buf(full_url) + + if err := json.Unmarshal(json_buf, results); err != nil { + return err + } + return nil +} |