--- Log opened Fri Jan 03 00:00:12 2014 | ||
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 240 seconds] | 00:31 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 00:33 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has joined ##hplusroadmap | 00:35 | |
-!- Viper168_ [~Viper@unaffiliated/viper168] has quit [Ping timeout: 264 seconds] | 00:37 | |
-!- Adifex [~Adifex@71-33-177-160.hlrn.qwest.net] has joined ##hplusroadmap | 00:43 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 246 seconds] | 00:45 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 00:58 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has quit [Ping timeout: 240 seconds] | 01:16 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 240 seconds] | 01:34 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 01:36 | |
-!- justanotheruser [~justanoth@95.211.191.41] has joined ##hplusroadmap | 01:39 | |
-!- justanotheruser [~justanoth@95.211.191.41] has quit [Changing host] | 01:39 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has joined ##hplusroadmap | 01:39 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 240 seconds] | 01:45 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.221.168] has joined ##hplusroadmap | 01:52 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.221.168] has quit [Max SendQ exceeded] | 01:56 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 01:58 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.221.168] has joined ##hplusroadmap | 01:59 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.221.168] has quit [Max SendQ exceeded] | 02:02 | |
-!- ElixirVitae [~Shehrazad@144.122.189.207] has joined ##hplusroadmap | 02:10 | |
-!- ElixirVitae [~Shehrazad@144.122.189.207] has quit [Changing host] | 02:10 | |
-!- ElixirVitae [~Shehrazad@unaffiliated/shehrazad] has joined ##hplusroadmap | 02:10 | |
-!- lichen [~lichen@c-50-139-11-6.hsd1.or.comcast.net] has joined ##hplusroadmap | 02:23 | |
-!- strangewarp_ [~strangewa@c-67-176-51-230.hsd1.co.comcast.net] has joined ##hplusroadmap | 02:33 | |
-!- strangewarp [~strangewa@c-67-176-51-230.hsd1.co.comcast.net] has quit [Ping timeout: 272 seconds] | 02:35 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Read error: Operation timed out] | 02:45 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 03:00 | |
-!- kyknos_ [~kyknos@89.233.130.143] has quit [Ping timeout: 240 seconds] | 03:01 | |
-!- EnLilaSko [EnLilaSko@unaffiliated/enlilasko] has joined ##hplusroadmap | 03:22 | |
-!- ElixirVitae [~Shehrazad@unaffiliated/shehrazad] has quit [Ping timeout: 264 seconds] | 03:37 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Read error: Operation timed out] | 03:46 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 03:58 | |
-!- ElixirVitae [~Shehrazad@unaffiliated/shehrazad] has joined ##hplusroadmap | 04:00 | |
-!- Adifex [~Adifex@71-33-177-160.hlrn.qwest.net] has quit [Quit: Just going out for a swim...] | 04:15 | |
-!- chris_99 [~chris_99@unaffiliated/chris-99/x-3062929] has joined ##hplusroadmap | 04:17 | |
-!- yorick [~yorick@oftn/member/yorick] has joined ##hplusroadmap | 04:32 | |
-!- Adifex [~Adifex@71-33-177-160.hlrn.qwest.net] has joined ##hplusroadmap | 04:39 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.219.54] has joined ##hplusroadmap | 04:46 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 246 seconds] | 04:47 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.219.54] has quit [Max SendQ exceeded] | 04:48 | |
-!- Adifex [~Adifex@71-33-177-160.hlrn.qwest.net] has quit [Quit: Just going out for a swim...] | 04:56 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 05:00 | |
-!- kyknos_ [kyknos@nat/novell/x-wplsbwyulqzhxzat] has joined ##hplusroadmap | 05:01 | |
-!- eudoxia [~eudoxia@r186-54-8-208.dialup.adsl.anteldata.net.uy] has joined ##hplusroadmap | 05:43 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Read error: Operation timed out] | 05:46 | |
-!- eudoxia [~eudoxia@r186-54-8-208.dialup.adsl.anteldata.net.uy] has quit [Read error: Connection reset by peer] | 05:50 | |
-!- lichen [~lichen@c-50-139-11-6.hsd1.or.comcast.net] has quit [Ping timeout: 240 seconds] | 05:52 | |
-!- lichen [~lichen@c-50-139-11-6.hsd1.or.comcast.net] has joined ##hplusroadmap | 05:53 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 06:01 | |
-!- eudoxia [~eudoxia@r186-52-63-141.dialup.adsl.anteldata.net.uy] has joined ##hplusroadmap | 06:06 | |
-!- klafka [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has quit [Remote host closed the connection] | 06:26 | |
-!- klafka [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has joined ##hplusroadmap | 06:26 | |
-!- klafka [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has quit [Ping timeout: 260 seconds] | 06:31 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has quit [Ping timeout: 264 seconds] | 06:39 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has joined ##hplusroadmap | 06:46 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 06:48 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has joined ##hplusroadmap | 06:50 | |
-!- ElixirVitae [~Shehrazad@unaffiliated/shehrazad] has quit [Quit: Leaving] | 06:59 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 07:01 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has quit [Ping timeout: 252 seconds] | 07:13 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.220.154] has joined ##hplusroadmap | 07:18 | |
-!- eudoxia [~eudoxia@r186-52-63-141.dialup.adsl.anteldata.net.uy] has quit [Quit: Leaving] | 07:25 | |
-!- pad2 [~not@100.43.114.90] has joined ##hplusroadmap | 07:30 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.220.154] has quit [Ping timeout: 246 seconds] | 07:31 | |
-!- Guest76816 [~not@100.43.114.90] has quit [Ping timeout: 246 seconds] | 07:33 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has joined ##hplusroadmap | 07:46 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 260 seconds] | 07:49 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has quit [Max SendQ exceeded] | 07:51 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has joined ##hplusroadmap | 07:53 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has quit [Excess Flood] | 07:55 | |
-!- rayston [~rayston@ip68-3-129-200.ph.ph.cox.net] has quit [Read error: Operation timed out] | 07:57 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 07:58 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has joined ##hplusroadmap | 07:58 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has quit [Max SendQ exceeded] | 08:02 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has joined ##hplusroadmap | 08:04 | |
-!- nsh [~nsh@host86-158-73-232.range86-158.btcentralplus.com] has joined ##hplusroadmap | 08:16 | |
-!- nsh [~nsh@host86-158-73-232.range86-158.btcentralplus.com] has quit [Changing host] | 08:16 | |
-!- nsh [~nsh@wikipedia/nsh] has joined ##hplusroadmap | 08:16 | |
-!- JayDugger [~jwdugger@pool-173-74-79-151.dllstx.fios.verizon.net] has quit [Quit: Leaving.] | 08:26 | |
-!- eudoxia [~eudoxia@r186-52-63-141.dialup.adsl.anteldata.net.uy] has joined ##hplusroadmap | 08:49 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 08:50 | |
kanzure | hrmm any thoughts on whether this contribution is worthwhile? https://github.com/kanzure/python-brlcad/pull/12/files#diff-2 | 08:58 |
---|---|---|
kanzure | i'm a little opposed to a .cfg file, it should probably just be .yaml | 08:58 |
-!- yorick [~yorick@oftn/member/yorick] has quit [Remote host closed the connection] | 09:02 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 09:04 | |
eudoxia | gradstudentbot, say something funny | 09:25 |
gradstudentbot | Dropped my sample. | 09:25 |
eudoxia | just rub it a little and put it back in the microscope noone will notice | 09:26 |
-!- aelinoea [~aelinoea@a88-113-45-152.elisa-laajakaista.fi] has joined ##hplusroadmap | 09:26 | |
-!- ThomasEgi [~thomas@185.5.8.81] has joined ##hplusroadmap | 09:31 | |
-!- ThomasEgi [~thomas@185.5.8.81] has quit [Changing host] | 09:31 | |
-!- ThomasEgi [~thomas@panda3d/ThomasEgi] has joined ##hplusroadmap | 09:31 | |
-!- eudoxia [~eudoxia@r186-52-63-141.dialup.adsl.anteldata.net.uy] has quit [Quit: Leaving] | 09:43 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 09:50 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 10:04 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 260 seconds] | 10:51 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 11:04 | |
kanzure | there should be a hardware site called hard fork | 11:08 |
-!- Adillian [~Adillian@94.9.98.141] has joined ##hplusroadmap | 11:13 | |
-!- strages [sid11297@gateway/web/irccloud.com/x-hszhmliqmagzmcro] has joined ##hplusroadmap | 11:40 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 260 seconds] | 11:51 | |
-!- entelechios [~elysium@181.194.139.149] has quit [Ping timeout: 240 seconds] | 12:00 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 12:04 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has quit [Read error: Connection reset by peer] | 12:17 | |
-!- klafka [~klafka@c-50-161-113-143.hsd1.ca.comcast.net] has joined ##hplusroadmap | 12:39 | |
-!- entelechios [~elysium@190.184.196.50] has joined ##hplusroadmap | 12:44 | |
-!- Viper168_ [~Viper@unaffiliated/viper168] has joined ##hplusroadmap | 12:49 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has quit [Ping timeout: 245 seconds] | 12:50 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.222.47] has quit [Ping timeout: 252 seconds] | 12:52 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 12:53 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has joined ##hplusroadmap | 12:57 | |
-!- klafka_ [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has joined ##hplusroadmap | 12:59 | |
kyknos_ | paperbot: http://pubs.rsc.org/en/content/articlelanding/2013/sc/c3sc52928b/unauth#!divAbstract | 12:59 |
-!- klafka [~klafka@c-50-161-113-143.hsd1.ca.comcast.net] has quit [Ping timeout: 246 seconds] | 13:01 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 13:04 | |
paperbot | http://diyhpl.us/~bryan/papers2/paperbot/Photoscopy%3A%20Spectroscopic%20Information%20from%20Camera%20Snapshots%3F.pdf | 13:05 |
nmz787 | paperbot: http://dx.doi.org/10.1039/C3SC52928B | 13:13 |
katsmeow-afk | adobe won't open that | 13:13 |
kanzure | it's technically not a valid pdf | 13:14 |
kanzure | but also you shouldn't be using any adobe software because of how awful their track record is with security | 13:14 |
katsmeow-afk | yet it starts with %PDF-1.4 | 13:15 |
kanzure | pdfparanoia manipulates every incoming pdf file in a way that makes it a technically invalid pdf file | 13:15 |
ParahSailin | it doesnt have xref table | 13:15 |
kanzure | it should have an xref table but pdfparanoia makes the xref table probably wrong | 13:15 |
katsmeow-afk | :-/ | 13:15 |
katsmeow-afk | :-/ | 13:16 |
ParahSailin | it doesnt even endstream and endobj that last stream object | 13:16 |
kanzure | hrm that seems worthy of debugging | 13:16 |
ParahSailin | kanzure: dont worry about it | 13:16 |
kanzure | huh? | 13:17 |
kanzure | oh do you have your super secret haskell pdf parser-generator yet | 13:17 |
ParahSailin | almost done | 13:17 |
kanzure | i was being facetious, i dunno if you're actually writing one | 13:17 |
katsmeow-afk | what do you suggest i open the mangled pdf with? | 13:17 |
ParahSailin | its unopenable | 13:18 |
nmz787 | katsmeow-afk: http://diyhpl.us/~nmz787/pdf/Photoscopy_Spectroscopic_Information_from_Camera_Snapshots_.pdf | 13:18 |
kanzure | there are, apparently, other problems with that pdf | 13:18 |
nmz787 | it's because pdfparanoia is broken | 13:18 |
-!- FourFire [~fourfire@214-137-212.connect.netcom.no] has joined ##hplusroadmap | 13:18 | |
katsmeow-afk | then i am so glad we had this discussion | 13:18 |
nmz787 | and i never pushed my changes because i thought kanzure might want me to keep my GUI stuff separate | 13:18 |
ParahSailin | actually lemme see if adding the endstream fixes it | 13:18 |
nmz787 | the pdf i sent works | 13:18 |
paperbot | http://diyhpl.us/~bryan/papers2/paperbot/Photoscopy%3A%20Spectroscopic%20Information%20from%20Camera%20Snapshots%3F.pdf | 13:19 |
nmz787 | the manipulate command is broken | 13:19 |
katsmeow-afk | nmz is correct, and his file is 700k bigger | 13:19 |
ParahSailin | nope, the endstream and endobj dont fix it | 13:19 |
-!- klafka_ [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has quit [Read error: Connection reset by peer] | 13:19 | |
-!- klafka [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has joined ##hplusroadmap | 13:20 | |
nmz787 | it might be due to this function being broken https://github.com/kanzure/pdfparanoia/blob/master/pdfparanoia/eraser.py#L10 | 13:21 |
katsmeow-afk | nmz787 , the page caught my eye because i have collected a few Canon A530 for other photo reasons | 13:21 |
nmz787 | it always skips the first object | 13:21 |
ParahSailin | fatal error seems to be a /undefined in /BXlevel | 13:21 |
nmz787 | i wrote a fixed version, lemme upload it | 13:21 |
gradstudentbot | No, you definitely have a right to your own opinion. I just.. wish you wouldn't voice it. | 13:22 |
* katsmeow-afk unplugs gradstudentbot | 13:23 | |
gradstudentbot | Grant submitted. | 13:23 |
kanzure | nmz787: why is manipulate_pdf broken? | 13:27 |
kanzure | nmz787: why are you passive aggressively withholding code? | 13:27 |
kanzure | you're worried that i might say it could be better? big fucking deal... i often write terrible things that need to get fixed. | 13:27 |
uberj | paperbot: http://www.sciencedirect.com/science/article/pii/S0006291X0900134X | 13:28 |
paperbot | http://diyhpl.us/~bryan/papers2/paperbot/368b4b2b263eda204151cd1aebf2a490.txt | 13:28 |
nmz787 | no | 13:28 |
uberj | paperbot: you never work | 13:28 |
nmz787 | i'm just busy and hate github | 13:28 |
kanzure | uberj: feel free to fix the bug | 13:28 |
nmz787 | like now it's such a PITA to add code | 13:28 |
kanzure | paperbot: http://www.sciencedirect.com/science/article/pii/S0006291X0900134X/pdfft?md5=e4909f0ac890901cf45ef009c299a33c&pid=1-s2.0-S0006291X0900134X-main.pdf | 13:28 |
paperbot | http://diyhpl.us/~bryan/papers2/paperbot/6db31cc127ec1d0d85eabf725ac19e5a.pdf | 13:28 |
kanzure | uberj: there you go | 13:29 |
kanzure | man you guys all suck | 13:29 |
uberj | kanzure: ah, so I guess I'm not linking the right url | 13:29 |
kanzure | fix shit on your own i'm not going to always be around to fix bugs 4 seconds after you report it | 13:29 |
uberj | kanzure: where on the page did you find that url? | 13:30 |
uberj | in this case, paperbot isn't broken, its users are. | 13:31 |
kanzure | no, this is a paperbot bug | 13:31 |
kanzure | it's clearly in the html that paperbot returned to you | 13:31 |
uberj | gotcha | 13:32 |
nmz787 | kanzure: here is the working code https://github.com/nmz787/pdf-watermark-removal/blob/master/pdf-watermark-removal.py#L213 | 13:33 |
kanzure | you.. created a new repo? | 13:33 |
nmz787 | sure | 13:34 |
kanzure | argh this is a fucking flask server | 13:34 |
nmz787 | yep | 13:34 |
kanzure | separation of concerns *beats you with a stick* | 13:34 |
nmz787 | well i forked from pdfparanoia then stopped using that pdfparser because you weren't actually using it to write | 13:34 |
nmz787 | and the removal code you had was broken, and by writing the enumerate myself I elucidated how to properly write remove_object | 13:35 |
nmz787 | i did not however write any unit tests as I know you mentioned there arent any | 13:35 |
kanzure | i haven't mentioned anything about the lack of tests of pdf-watermark-removal.git ever | 13:36 |
nmz787 | as I stopped working on the javascript stuff because i needed to figure out the randomization of removing objects algorithm | 13:36 |
kanzure | i just learned about this repo 5 seconds ago | 13:36 |
nmz787 | you're forgetting i said i forked it from your code | 13:36 |
nmz787 | and you said you didn't have unit tests for the remove code | 13:36 |
nmz787 | in your code | 13:36 |
kanzure | i think that adding an entire web server is a huge mistake and that it limits the availability of this in other contexts. eg. it means that if paperbot uses it, it suddenly has to run wsgi stuff.. | 13:36 |
nmz787 | since this is basically the same with the addition of the image generation and flask stuff | 13:37 |
nmz787 | well it can be broken apart | 13:37 |
nmz787 | just easier to test with one file | 13:37 |
nmz787 | anyway, it's generating images nicely from PDF pages, so presenting them to the user with "is the watermark gone yes/no" is all that's left | 13:38 |
nmz787 | that binary search or whatever you mentioned | 13:39 |
gradstudentbot | Friends don't let friends go to super school. | 13:39 |
ParahSailin | http server for watermark removal? | 13:43 |
nmz787 | for learning a new publisher | 13:43 |
kanzure | the object id is going to be different between each pdf | 13:43 |
nmz787 | s/learning/training/ | 13:43 |
kanzure | it doesn't do that | 13:43 |
nmz787 | you told me the first thing was to find the object that needed removing | 13:43 |
kanzure | yes, so that you can write a plugin for pdfparanoia that searches for similar objects | 13:44 |
nmz787 | then you know what to search for content-wise in future | 13:44 |
nmz787 | i thought | 13:44 |
kanzure | just knowing the id is not enough | 13:44 |
kanzure | knowing the id is necessary for starting the process of reverse engineering | 13:44 |
-!- aelinoea [~aelinoea@a88-113-45-152.elisa-laajakaista.fi] has quit [Quit: Leaving] | 13:44 | |
nmz787 | nah i thought you'd search in future with content of that object | 13:44 |
kanzure | the content is often obfuscated using whatever encodings that i probably don't know; often it's based on dimensions or geometry or coordinates | 13:45 |
kanzure | making a blocking http server for pdf watermark removal is really really bad. you should at least make it non-blocking, and then move all the watermark removal stuff into a separate module so that it's not dependent on wsgi/flask things. | 13:45 |
nmz787 | also, seems like you'd just have to do it for a few papers from that publisher to see what their watermark data was, do a diff between all the watermark objects you've collected | 13:46 |
kanzure | diffing the content of the watermark objects wont tell you much | 13:46 |
nmz787 | you also said with a binary search of removing objects you usually get it in 6-8 hits | 13:46 |
kanzure | i was talking about a manual process for starting the reverse engineering process | 13:47 |
nmz787 | so i am fine with doing that for each pdf i upload for now until we can get the training part working better | 13:47 |
nmz787 | for now even just for debug i think it's valuable | 13:47 |
nmz787 | it wasn't very slow or anything | 13:47 |
ParahSailin | no, diff the same paper downloaded from different locations | 13:48 |
kanzure | ParahSailin: he's talking about something else.. | 13:48 |
kanzure | ParahSailin: he wants to create some svm thing for detecting the watermark objects based on 'training data sets' instead of the plugin approach where a programmer figures out how to remove the watermark | 13:48 |
nmz787 | sure, so the IP is different, so but hopefully they aren't encoding with error-correction | 13:48 |
nmz787 | i.e. nested interleaved data | 13:48 |
nmz787 | which i doubt they are using | 13:49 |
ParahSailin | dont really need to do something that wild to train detection | 13:49 |
kanzure | ParahSailin: otherwise i can't explain why he is using the word 'training' if he didn't mean machine learning.. | 13:49 |
nmz787 | so i'd think the IP section of the coding would be different, but the "You downloaded from Springer.com" wouldn't be | 13:49 |
nmz787 | svm? | 13:49 |
nmz787 | no way | 13:49 |
nmz787 | you told me that i should randomly remove objects til it was gone and my content wasnt | 13:50 |
kanzure | fuck you, learn to read | 13:50 |
nmz787 | so i made the function to get any pdf page | 13:50 |
nmz787 | as a png | 13:50 |
ParahSailin | removing entire objects is going to break many pdfs | 13:50 |
kanzure | yes | 13:50 |
ParahSailin | because often the watermark is part of the same stream as the content | 13:50 |
kanzure | i was explaining a manual process for identifying a watermark's object id | 13:50 |
kanzure | by a binary search of removing objects | 13:50 |
nmz787 | and i wanted to present to myself that image with a yes/no box, along with a count of the # of objects currently removed | 13:50 |
kanzure | and then once you find the id, you can identify how to find it more easily (geometry, size, placement, encoding, etc) | 13:51 |
ParahSailin | you just want to remove that particular BT ... ET section | 13:51 |
kanzure | i didn't tell you to randomly remove objects and the ncreate machine learning training data sets or whatever | 13:51 |
kanzure | *then | 13:51 |
nmz787 | i was under the assumption you just removed any object, since that's all pdfparanoia looked like it was doing | 13:52 |
nmz787 | in the plugins | 13:52 |
kanzure | it's removing a specific object | 13:52 |
kanzure | each plugin finds a very specific object | 13:52 |
nmz787 | there are no machine learning ANYTHING in my head with this project | 13:52 |
nmz787 | you segued onto that somehow but it's not me man | 13:52 |
kanzure | you keep saying 'training' and 'diff the watermarks' | 13:52 |
nmz787 | yes | 13:52 |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 245 seconds] | 13:52 | |
nmz787 | the difference should only be the IP address | 13:53 |
nmz787 | which is somehow encoded | 13:53 |
nmz787 | if it isn't using error-correction or encryption it will be surrounded by the same journal watermark text | 13:53 |
kanzure | what the hell does that have to do with making a flask server :( blaaaaah | 13:53 |
nmz787 | "you downloaded from Springer.com from IP 000.000.123.122 have a nice day | 13:53 |
nmz787 | " | 13:53 |
nmz787 | you're stuck on that | 13:54 |
ParahSailin | i think you should be happy that he pushed stuff onto github | 13:54 |
nmz787 | that's minimal | 13:54 |
kanzure | ParahSailin: or angry that he doesn't listen | 13:54 |
nmz787 | that's just how i wanted to connect to the user | 13:54 |
nmz787 | it's that you are going asperbers and not seeing my perspective | 13:54 |
kanzure | your user that is writing a pdfparanoia plugin? | 13:55 |
nmz787 | i don | 13:55 |
nmz787 | 't use nodeJS or any phantomJS or whatever | 13:55 |
kanzure | what does nodejs or phantomjs have to do with this now ? | 13:55 |
nmz787 | because that's what you'll suggest if i ask about displaying a PNG | 13:55 |
kanzure | you shouldn't be displaying a png in the first place! separation of concerns | 13:56 |
kanzure | just generate a png, and then a ui layer (whatever the user chooses or if another developer spits it up over http, fine) chooses | 13:56 |
-!- Adillian [~Adillian@94.9.98.141] has quit [Ping timeout: 240 seconds] | 13:56 | |
kanzure | s/) chooses/) displays/ | 13:56 |
nmz787 | i chose web UI layer | 13:56 |
kanzure | yeah and then you stuck all your pdf parsing code into the same thread | 13:56 |
nmz787 | and flask was like 20 lines of code i already had | 13:56 |
kanzure | as the request/response | 13:57 |
nmz787 | so very simple! | 13:57 |
nmz787 | you sucl | 13:57 |
kanzure | but it's also wrong and broken and forces everyone else who imports this file to use wsgi/flask | 13:57 |
nmz787 | k | 13:57 |
nmz787 | your coding help sucks | 13:57 |
nmz787 | you | 13:57 |
nmz787 | 're mean | 13:57 |
kanzure | what do you not understand about my suggestions? | 13:57 |
nmz787 | and rude | 13:57 |
kanzure | i disagree about my coding help sucking, maybe you can tell me what you don't understand or disagree with | 13:57 |
nmz787 | no | 13:58 |
kanzure | yes i'm mean and rude, i have every right to be given the previous conversation before today *plus* your continued actions | 13:58 |
nmz787 | I have a farmer to go help build a barn with | 13:58 |
nmz787 | I do more than just code | 13:58 |
nmz787 | you can't understand that | 13:58 |
nmz787 | you never have been able to understand why biologists can't use computers | 13:58 |
nmz787 | and you don't realize that i fall between them and you | 13:59 |
nmz787 | and you don't know how to see or understand my perspective | 13:59 |
nmz787 | maybe you are the one not thinking things through thoroughly | 13:59 |
nmz787 | i wrote a bunch of code, I wasn't rude at all | 14:00 |
kanzure | code can be rude and do rude things :) | 14:00 |
nmz787 | I wanted to write a plugin but I couldn't understand it | 14:00 |
nmz787 | I found errors in your code | 14:00 |
nmz787 | I knew you wouldn't like flask so I didnt fork your code | 14:00 |
kanzure | i explained how it worked to you and you asked questions and then i clarified (not today) | 14:00 |
kanzure | i like flask just fine, for web servers | 14:01 |
nmz787 | sorry I lacked attribution to you | 14:01 |
nmz787 | you also know I wrote a flask server to receive pdfs from my browser | 14:01 |
kanzure | you found errors but you expected me to have 100% complete coverage of all of modern science, which is completely unreasonable. i also said i was willing to accept bugfixes and new features. | 14:01 |
nmz787 | and i've mentioned wanting to integrate watermark removal, so flask is no more overhead in my existing application | 14:02 |
kanzure | (i never advertised pdfparanoia as working across all known publishers) | 14:02 |
nmz787 | sorry i didn't attribute your codebase, ParahSailin too I guess and whoever else, I'll try to fix it but I have to go now. | 14:02 |
nmz787 | I just wanted to make things better. | 14:03 |
nmz787 | Sorry I tried. | 14:03 |
nmz787 | Do you blame me for being mad? | 14:03 |
katsmeow-afk | my dog, shhesh | 14:03 |
nmz787 | Sorry for that too, if so. | 14:03 |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 14:06 | |
-!- nsh [~nsh@wikipedia/nsh] has quit [Ping timeout: 260 seconds] | 14:09 | |
ParahSailin | nmz787: for future reference, its easiest to use gs and https://maemo.gitorious.org/maemo-pkg/ghostscript/source/38a0cb22a559ee2492ecf77be8361fcd30346a4a:toolbin/pdfinflt.ps to inflate a pdf then browse it in text editor | 14:13 |
-!- yorick [~yorick@oftn/member/yorick] has joined ##hplusroadmap | 14:13 | |
katsmeow-afk | nmz787 , would you know a glue that will stick to 2 liter pop bottle plastic? | 14:14 |
Qfwfq | ParahSailin: Good tip, thanks. | 14:16 |
kanzure | you should do the thing where you draw ids on each object instead of asking a user to do things over HTTP. then you just spit out a png and you can identify the ids on each page. | 14:17 |
-!- nsh [~nsh@host86-158-73-232.range86-158.btcentralplus.com] has joined ##hplusroadmap | 14:18 | |
katsmeow-afk | hmm, locktite construction adhesive | 14:25 |
kanzure | not the most useful visualization but whatevs http://binwalk.org/wp-content/uploads/2013/12/pdf_3d.gif | 14:44 |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 252 seconds] | 14:53 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 15:07 | |
FourFire | hello everyone | 15:23 |
FourFire | I'm feeling that my hardware is corrupted a lot today :( | 15:24 |
Dantespeaks | I just got a Core 2 quad at 2.33ghz, 4gb ram. and ive been using a Pentium 4. And this is a significant improvement. | 15:39 |
Dantespeaks | and i paid 130 bucks. yay! | 15:40 |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has quit [Read error: Connection reset by peer] | 15:48 | |
-!- Viper168_ [~Viper@unaffiliated/viper168] has quit [Ping timeout: 245 seconds] | 15:52 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Read error: Operation timed out] | 15:53 | |
-!- EnLilaSko [EnLilaSko@unaffiliated/enlilasko] has quit [Quit: - nbs-irc 2.39 - www.nbs-irc.net -] | 15:59 | |
FourFire | wooh | 16:03 |
FourFire | I'm hoping my i5 460m will arrive in the post real soon | 16:03 |
FourFire | I'm using a P4500 atm | 16:03 |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 16:07 | |
-!- drewbot [~cinch@ec2-54-224-203-27.compute-1.amazonaws.com] has quit [Remote host closed the connection] | 16:23 | |
-!- drewbot [~cinch@ec2-54-224-216-85.compute-1.amazonaws.com] has joined ##hplusroadmap | 16:24 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has joined ##hplusroadmap | 16:25 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has joined ##hplusroadmap | 16:25 | |
-!- klafka [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has quit [Read error: Connection reset by peer] | 16:32 | |
-!- klafka [~klafka@c-24-6-18-31.hsd1.ca.comcast.net] has joined ##hplusroadmap | 16:33 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 260 seconds] | 16:54 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 17:08 | |
-!- chris_99 [~chris_99@unaffiliated/chris-99/x-3062929] has quit [Quit: Leaving] | 17:24 | |
-!- rayston [~rayston@ip68-3-129-200.ph.ph.cox.net] has joined ##hplusroadmap | 17:43 | |
-!- kyknos_ [kyknos@nat/novell/x-wplsbwyulqzhxzat] has quit [Ping timeout: 264 seconds] | 17:50 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 17:55 | |
-!- _Sol_ [~Sol@c-174-57-58-11.hsd1.pa.comcast.net] has quit [Read error: Connection reset by peer] | 17:59 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has quit [Quit: Try HydraIRC -> http://www.hydrairc.com <-] | 18:03 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 18:08 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has joined ##hplusroadmap | 18:26 | |
-!- yorick [~yorick@oftn/member/yorick] has quit [Remote host closed the connection] | 18:29 | |
-!- kyknos_ [~kyknos@89.233.130.143] has joined ##hplusroadmap | 18:39 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 260 seconds] | 18:56 | |
-!- Adifex [~Adifex@75-148-41-126-Colorado.hfc.comcastbusiness.net] has joined ##hplusroadmap | 19:04 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 19:09 | |
-!- yashgaroth [~ffffff@2606:6000:b240:8200:f533:a037:83b6:c75b] has joined ##hplusroadmap | 19:19 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has quit [Read error: Connection reset by peer] | 19:53 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 252 seconds] | 19:56 | |
-!- lichen [~lichen@c-50-139-11-6.hsd1.or.comcast.net] has quit [Quit: Lost terminal] | 19:59 | |
-!- oblique [~oblique@unaffiliated/oblique] has quit [Ping timeout: 245 seconds] | 20:00 | |
-!- pads [~not@100.43.114.90] has joined ##hplusroadmap | 20:00 | |
-!- oblique [~oblique@unaffiliated/oblique] has joined ##hplusroadmap | 20:00 | |
-!- pads is now known as Guest67409 | 20:01 | |
-!- pad2 [~not@100.43.114.90] has quit [Ping timeout: 265 seconds] | 20:03 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 20:10 | |
-!- Dantespeaks [~Dantespea@206-248-156-17.dsl.teksavvy.com] has joined ##hplusroadmap | 20:41 | |
-!- entelechios [~elysium@190.184.196.50] has quit [Ping timeout: 246 seconds] | 20:43 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 20:57 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has quit [Ping timeout: 240 seconds] | 21:03 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 21:10 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has joined ##hplusroadmap | 21:19 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has quit [Ping timeout: 252 seconds] | 21:24 | |
-!- yashgaroth [~ffffff@2606:6000:b240:8200:f533:a037:83b6:c75b] has quit [Quit: Leaving] | 21:31 | |
-!- justanotheruser [~justanoth@95.211.138.27] has joined ##hplusroadmap | 21:39 | |
-!- justanotheruser [~justanoth@95.211.138.27] has quit [Changing host] | 21:39 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has joined ##hplusroadmap | 21:39 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 252 seconds] | 21:57 | |
-!- entelechios [~elysium@181.194.139.149] has joined ##hplusroadmap | 21:59 | |
-!- Adifex [~Adifex@75-148-41-126-Colorado.hfc.comcastbusiness.net] has quit [Ping timeout: 260 seconds] | 22:03 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has quit [Ping timeout: 272 seconds] | 22:05 | |
-!- Adifex [~Adifex@75-148-41-126-Colorado.hfc.comcastbusiness.net] has joined ##hplusroadmap | 22:06 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.216.21] has joined ##hplusroadmap | 22:09 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 22:11 | |
-!- kuldeepdhaka [~kuldeepdh@117.254.216.21] has quit [Max SendQ exceeded] | 22:13 | |
-!- justanotheruser1 [~justanoth@ip24-252-25-244.om.om.cox.net] has joined ##hplusroadmap | 22:14 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has quit [Ping timeout: 245 seconds] | 22:15 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has joined ##hplusroadmap | 22:18 | |
-!- justanotheruser1 [~justanoth@ip24-252-25-244.om.om.cox.net] has quit [Read error: Connection reset by peer] | 22:19 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has quit [Client Quit] | 22:22 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has joined ##hplusroadmap | 22:23 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has quit [Changing host] | 22:30 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has joined ##hplusroadmap | 22:30 | |
-!- justanotheruser [~justanoth@unaffiliated/justanotheruser] has quit [Ping timeout: 245 seconds] | 22:35 | |
-!- FourFire [~fourfire@214-137-212.connect.netcom.no] has quit [Quit: Leaving] | 22:41 | |
-!- Adifex is now known as Adifex[0] | 22:46 | |
-!- JayDugger [~jwdugger@pool-173-74-79-151.dllstx.fios.verizon.net] has joined ##hplusroadmap | 22:52 | |
-!- Viper168 [~Viper@unaffiliated/viper168] has joined ##hplusroadmap | 22:54 | |
-!- JayDugger [~jwdugger@pool-173-74-79-151.dllstx.fios.verizon.net] has quit [Ping timeout: 252 seconds] | 22:58 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 272 seconds] | 22:59 | |
-!- Adifex[0] [~Adifex@75-148-41-126-Colorado.hfc.comcastbusiness.net] has quit [Quit: Just going out for a swim...] | 23:00 | |
-!- JayDugger [~jwdugger@pool-173-74-79-151.dllstx.fios.verizon.net] has joined ##hplusroadmap | 23:05 | |
-!- ThomasEgi [~thomas@panda3d/ThomasEgi] has quit [Quit: ... disappearing in a puff of python magic] | 23:09 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has joined ##hplusroadmap | 23:11 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has joined ##hplusroadmap | 23:24 | |
-!- justanotheruser [~justanoth@ip24-252-25-244.om.om.cox.net] has quit [Ping timeout: 246 seconds] | 23:40 | |
-!- Daelus001 [~Daelus001@201-246-149-239.baf.movistar.cl] has joined ##hplusroadmap | 23:40 | |
-!- Adifex [~Adifex@75-148-41-126-Colorado.hfc.comcastbusiness.net] has joined ##hplusroadmap | 23:51 | |
-!- entelechios [~elysium@181.194.139.149] has quit [Ping timeout: 260 seconds] | 23:54 | |
-!- Adifex [~Adifex@75-148-41-126-Colorado.hfc.comcastbusiness.net] has quit [Client Quit] | 23:55 | |
-!- lupfantomo [~lupfantom@24-159-24-229.dhcp.jcsn.tn.charter.com] has quit [Ping timeout: 245 seconds] | 23:59 | |
--- Log closed Sat Jan 04 00:00:13 2014 |
Generated by irclog2html.py 2.15.0.dev0 by Marius Gedminas - find it at mg.pov.lt!